From b3f881a54c8cb417645de67ee9e18fe6b23e21cc Mon Sep 17 00:00:00 2001 From: John McMaster Date: Thu, 23 Aug 2018 18:18:36 -0700 Subject: [PATCH 01/55] timfuz: rref test Signed-off-by: John McMaster --- experiments/timfuz/.gitignore | 9 + experiments/timfuz/Makefile | 22 + experiments/timfuz/README.txt | 71 + experiments/timfuz/benchmark.py | 71 + experiments/timfuz/generate.sh | 9 + experiments/timfuz/generate.tcl | 279 +++ experiments/timfuz/node_unique.py | 99 + experiments/timfuz/oneblinkw.v | 37 + experiments/timfuz/picorv32.v | 2977 +++++++++++++++++++++++ experiments/timfuz/pip_unique.py | 89 + experiments/timfuz/placelut.py | 91 + experiments/timfuz/placelut_fb.py | 103 + experiments/timfuz/placelut_ff_fb.py | 126 + experiments/timfuz/speed.sh | 8 + experiments/timfuz/speed.tcl | 182 ++ experiments/timfuz/speed_json.py | 98 + experiments/timfuz/timfuz.py | 819 +++++++ experiments/timfuz/timfuz_checksub.py | 259 ++ experiments/timfuz/timfuz_corner_csv.py | 60 + experiments/timfuz/timfuz_csv.py | 272 +++ experiments/timfuz/timfuz_rref.py | 206 ++ experiments/timfuz/timfuz_solve.py | 98 + experiments/timfuz/top.v | 109 + experiments/timfuz/wire_unique.py | 92 + 24 files changed, 6186 insertions(+) create mode 100644 experiments/timfuz/.gitignore create mode 100644 experiments/timfuz/Makefile create mode 100644 experiments/timfuz/README.txt create mode 100644 experiments/timfuz/benchmark.py create mode 100755 experiments/timfuz/generate.sh create mode 100644 experiments/timfuz/generate.tcl create mode 100644 experiments/timfuz/node_unique.py create mode 100644 experiments/timfuz/oneblinkw.v create mode 100644 experiments/timfuz/picorv32.v create mode 100644 experiments/timfuz/pip_unique.py create mode 100644 experiments/timfuz/placelut.py create mode 100644 experiments/timfuz/placelut_fb.py create mode 100644 experiments/timfuz/placelut_ff_fb.py create mode 100755 experiments/timfuz/speed.sh create mode 100644 experiments/timfuz/speed.tcl create mode 100644 experiments/timfuz/speed_json.py create mode 100644 experiments/timfuz/timfuz.py create mode 100644 experiments/timfuz/timfuz_checksub.py create mode 100644 experiments/timfuz/timfuz_corner_csv.py create mode 100644 experiments/timfuz/timfuz_csv.py create mode 100644 experiments/timfuz/timfuz_rref.py create mode 100644 experiments/timfuz/timfuz_solve.py create mode 100644 experiments/timfuz/top.v create mode 100644 experiments/timfuz/wire_unique.py diff --git a/experiments/timfuz/.gitignore b/experiments/timfuz/.gitignore new file mode 100644 index 00000000..d0d215d0 --- /dev/null +++ b/experiments/timfuz/.gitignore @@ -0,0 +1,9 @@ +/.Xil +/design/ +/design.bit +/design.bits +/design.dcp +/usage_statistics_webtalk.* +/vivado* +/specimen_* +build_speed diff --git a/experiments/timfuz/Makefile b/experiments/timfuz/Makefile new file mode 100644 index 00000000..8da96c3f --- /dev/null +++ b/experiments/timfuz/Makefile @@ -0,0 +1,22 @@ +N := 1 +SPECIMENS := $(addprefix specimen_,$(shell seq -f '%03.0f' $(N))) +SPECIMENS_OK := $(addsuffix /OK,$(SPECIMENS)) + +all: $(SPECIMENS_OK) + #python timfuz.py specimen_*/timing.txt + +$(SPECIMENS_OK): + bash generate.sh $(subst /OK,,$@) + touch $@ + +run: + $(MAKE) clean + $(MAKE) all + touch run.ok + +clean: + rm -rf specimen_[0-9][0-9][0-9]/ seg_clblx.segbits __pycache__ run.ok + rm -rf vivado*.log vivado_*.str vivado*.jou design *.bits *.dcp *.bit + +.PHONY: database pushdb run clean + diff --git a/experiments/timfuz/README.txt b/experiments/timfuz/README.txt new file mode 100644 index 
00000000..5d37ec78
--- /dev/null
+++ b/experiments/timfuz/README.txt
@@ -0,0 +1,71 @@
+Timing analysis fuzzer
+This runs some random designs through Vivado and extracts timing information in order to derive timing models
+While Vivado has more involved RC (spice?) models incorporating fanout and other things,
+for now we are shooting for simple, conservative models with a min and max timing delay
+
+
+*******************************************************************************
+Background
+*******************************************************************************
+
+Vivado seems to associate each delay model with a "speed index"
+In particular, we are currently looking at pips and wires, each of which has a speed index associated with it
+For every timing path, we record the total delay from one site to another, excluding site delays
+(the timing analyzer provides an option to make this easy)
+We then walk along the path and record all wires and pips in between
+These are converted to their associated speed indexes
+This yields an equation stating that the delays for a given set of speed indexes sum to the measured delay value
+These equations are then fed into scipy.optimize.linprog to give estimates for the delay models
+(a small worked sketch appears at the end of this file)
+
+However, there are some complications. For example, given a system of equations like:
+t0 = 5
+t0 + t1 = 10
+t0 + t1 + t2 = 12
+the solver tends to lump all of the delay into t0 and leave the other variables at zero
+To get around this, we subtract equations from each other so that each row covers fewer shared elements
+
+Some additional info here: https://github.com/SymbiFlow/prjxray/wiki/Timing
+
+
+*******************************************************************************
+Quick start
+*******************************************************************************
+
+./speed.sh
+python timfuz_delay.py --cols-max 9 timfuz_dat/s1_timing2.txt
+This will report something like:
+Delay on 36 / 162
+
+Now add some more data in:
+python timfuz_delay.py --cols-max 9 timfuz_dat/speed_json.json timfuz_dat/s*_timing2.txt
+This should resolve a few more delay elements, say:
+Delay on 57 / 185
+
+
+*******************************************************************************
+From scratch
+*******************************************************************************
+
+The procedure is roughly:
+Edit generate.tcl: uncomment speed_models2
+Run "make N=1"
+python speed_json.py specimen_001/speed_model.txt speed_json.json
+Edit generate.tcl: comment speed_models2 again
+Run "make N=4" to generate some more timing data
+Now run as in the quick start:
+python timfuz_delay.py --cols-max 9 speed_json.json specimen_*/timing2.txt
+
+
+*******************************************************************************
+TODO:
+*******************************************************************************
+
+Verify elements are being imported correctly throughout the whole chain
+Can any wires or similar be aggregated?
+    Ex: if a node consists of two wire delay models and that pair is never seen elsewhere
+Look at virtual switchboxes. Can these be removed?
+Look at suspicious elements like WIRE_RC_ZERO
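+
+As an aside, here is a minimal sketch of the linprog setup described in the
+background section, using the toy numbers above. Treating each measured path
+as an upper bound and maximizing the total is only one plausible formulation;
+the actual solver setup lives in the timfuz scripts (see timfuz_solve.py and
+timfuz_rref.py):
+
+    import numpy as np
+    from scipy.optimize import linprog
+
+    # Three observed paths over delay variables t0, t1, t2 (toy numbers):
+    #   t0 = 5, t0 + t1 = 10, t0 + t1 + t2 = 12
+    A = np.array([[1., 0., 0.],
+                  [1., 1., 0.],
+                  [1., 1., 1.]])
+    b = np.array([5., 10., 12.])
+
+    # Subtract overlapping rows (and right-hand sides) so each row
+    # covers fewer shared elements, as described above
+    A[2] -= A[1]; b[2] -= b[1]  # leaves t2 <= 2
+    A[1] -= A[0]; b[1] -= b[0]  # leaves t1 <= 5
+
+    # Conservative estimate: maximize t0 + t1 + t2 subject to A t <= b, t >= 0
+    # (linprog minimizes, so negate the objective)
+    res = linprog(c=[-1, -1, -1], A_ub=A, b_ub=b, bounds=(0, None))
+    print(res.x)  # ~[5, 5, 2]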
diff --git a/experiments/timfuz/benchmark.py b/experiments/timfuz/benchmark.py
new file mode 100644
index 00000000..6da3e132
--- /dev/null
+++ b/experiments/timfuz/benchmark.py
@@ -0,0 +1,71 @@
+'''
+pr0ntools
+Benchmarking utility
+Copyright 2010 John McMaster
+'''
+
+import time
+
+def time_str(delta):
+    fraction = delta % 1
+    delta -= fraction
+    delta = int(delta)
+    seconds = delta % 60
+    # Integer division keeps hours/minutes as ints under Python 3
+    delta //= 60
+    minutes = delta % 60
+    delta //= 60
+    hours = delta
+    return '%02d:%02d:%02d.%04d' % (hours, minutes, seconds, fraction * 10000)
+
+class Benchmark:
+    start_time = None
+    end_time = None
+
+    def __init__(self, max_items=None):
+        # For the lazy
+        self.start_time = time.time()
+        self.end_time = None
+        self.max_items = max_items
+        self.cur_items = 0
+
+    def start(self):
+        self.start_time = time.time()
+        self.end_time = None
+        self.cur_items = 0
+
+    def stop(self):
+        self.end_time = time.time()
+
+    def advance(self, n=1):
+        self.cur_items += n
+
+    def set_cur_items(self, n):
+        self.cur_items = n
+
+    def delta_s(self):
+        if self.end_time:
+            return self.end_time - self.start_time
+        else:
+            return time.time() - self.start_time
+
+    def __str__(self):
+        if self.end_time:
+            return time_str(self.end_time - self.start_time)
+        elif self.max_items:
+            cur_time = time.time()
+            delta_t = cur_time - self.start_time
+            rate_s = 'N/A'
+            if delta_t > 0.000001:
+                rate = self.cur_items / delta_t
+                rate_s = '%f items / sec' % rate
+                if rate == 0:
+                    eta_str = 'inf'
+                else:
+                    remaining = (self.max_items - self.cur_items) / rate
+                    eta_str = time_str(remaining)
+            else:
+                eta_str = "indeterminate"
+            return '%d / %d, ETA: %s @ %s' % (self.cur_items, self.max_items, eta_str, rate_s)
+        else:
+            return time_str(time.time() - self.start_time)
+
diff --git a/experiments/timfuz/generate.sh b/experiments/timfuz/generate.sh
new file mode 100755
index 00000000..eebd0388
--- /dev/null
+++ b/experiments/timfuz/generate.sh
@@ -0,0 +1,9 @@
+#!/bin/bash
+
+set -ex
+
+source ${XRAY_GENHEADER}
+
+python ../placelut_ff_fb.py --sdx 4 --sdy 4 >placelut.v
+vivado -mode batch -source ../generate.tcl
+
diff --git a/experiments/timfuz/generate.tcl b/experiments/timfuz/generate.tcl
new file mode 100644
index 00000000..a2e76c71
--- /dev/null
+++ b/experiments/timfuz/generate.tcl
@@ -0,0 +1,279 @@
+source ../../../utils/utils.tcl
+
+proc pin_info {pin} {
+    set cell [get_cells -of_objects $pin]
+    set bel [get_bels -of_objects $cell]
+    set site [get_sites -of_objects $bel]
+    return "$site $bel"
+}
+
+proc pin_bel {pin} {
+    set cell [get_cells -of_objects $pin]
+    set bel [get_bels -of_objects $cell]
+    return $bel
+}
+
+proc build_design {} {
+    create_project -force -part $::env(XRAY_PART) design design
+    #read_verilog ../top.v
+    #read_verilog ../picorv32.v
+    #read_verilog ../oneblinkw.v
+    read_verilog placelut.v
+    synth_design -top top
+
+    puts "Locking pins"
+    set_property LOCK_PINS {I0:A1 I1:A2 I2:A3 I3:A4 I4:A5 I5:A6} \
+        [get_cells -quiet -filter {REF_NAME == LUT6} -hierarchical]
+
+    puts "Package stuff"
+    set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_00) IOSTANDARD LVCMOS33" [get_ports clk]
+    set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_01) IOSTANDARD LVCMOS33" [get_ports stb]
+    set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_02) IOSTANDARD LVCMOS33" [get_ports di]
+    set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_03) IOSTANDARD LVCMOS33" [get_ports do]
+
+    if {0 < 0} {
+        puts "pblocking"
+        create_pblock roi
+        set roipb [get_pblocks roi]
+        set_property EXCLUDE_PLACEMENT 1 $roipb
+        add_cells_to_pblock $roipb [get_cells roi]
+        resize_pblock $roipb -add "$::env(XRAY_ROI)"
+
+        puts "randplace"
+        randplace_pblock 150 $roipb
+    }
+
+    set_property CFGBVS VCCO [current_design]
+    set_property CONFIG_VOLTAGE 3.3 [current_design]
+    set_property BITSTREAM.GENERAL.PERFRAMECRC YES [current_design]
+
+    puts "dedicated route"
+    set_property CLOCK_DEDICATED_ROUTE FALSE [get_nets clk_IBUF]
+
+    place_design
+
+    route_design
+
+    write_checkpoint -force design.dcp
+    # disable combinatorial loop
+    # set_property IS_ENABLED 0 [get_drc_checks {LUTLP-1}]
+    #write_bitstream -force design.bit
+}
+
+# Changed to group wires and nodes
+# This allows tracing the full path along with pips
+proc write_info3 {} {
+    set outdir "."
+    set fp [open "$outdir/timing3.txt" w]
+    # bel is written as site/bel, so don't bother with a separate site column
+    puts $fp "net src_bel dst_bel ico fast_max fast_min slow_max slow_min pips inodes wires"
+
+    set TIME_start [clock clicks -milliseconds]
+    set verbose 0
+    set equations 0
+    set site_src_nets 0
+    set site_dst_nets 0
+    set neti 0
+    set nets [get_nets -hierarchical]
+    set nnets [llength $nets]
+    foreach net $nets {
+        incr neti
+        #if {$neti >= 10} {
+        #    puts "Debug break"
+        #    break
+        #}
+
+        puts "Net $neti / $nnets: $net"
+        # The semantics of get_pins -leaf are kind of odd
+        # When no passthrough LUTs exist, it has no effect
+        # When a passthrough LUT is present:
+        #   -w/o -leaf: some pins + passthrough LUT pins
+        #   -w/  -leaf: different pins + passthrough LUT pins
+        # With the OUT filter this seems to be sufficient
+        set src_pin [get_pins -leaf -filter {DIRECTION == OUT} -of_objects $net]
+        set src_bel [pin_bel $src_pin]
+        set src_site [get_sites -of_objects $src_bel]
+        # Only one net driver
+        set src_site_pins [get_site_pins -filter {DIRECTION == OUT} -of_objects $net]
+
+        # Sometimes this is empty for reasons that escape me
+        # Emitting direction doesn't help
+        if {[llength $src_site_pins] < 1} {
+            if $verbose {
+                puts "  Ignoring site internal net"
+            }
+            incr site_src_nets
+            continue
+        }
+        set dst_site_pins_net [get_site_pins -filter {DIRECTION == IN} -of_objects $net]
+        if {[llength $dst_site_pins_net] < 1} {
+            puts "  Skipping site internal source net"
+            incr site_dst_nets
+            continue
+        }
+        foreach src_site_pin $src_site_pins {
+            if $verbose {
+                puts "Source: $src_pin at site $src_site:$src_bel, spin $src_site_pin"
+            }
+
+            # Run with and without interconnect only
+            foreach ico "0 1" {
+                set ico_flag ""
+                if $ico {
+                    set ico_flag "-interconnect_only"
+                    set delays [get_net_delays $ico_flag -of_objects $net]
+                } else {
+                    set delays [get_net_delays -of_objects $net]
+                }
+                foreach delay $delays {
+                    set delaystr [get_property NAME $delay]
+                    set dst_pins [get_property TO_PIN $delay]
+                    set dst_pin [get_pins $dst_pins]
+                    #puts "  $delaystr: $src_pin => $dst_pin"
+                    set dst_bel [pin_bel $dst_pin]
+                    set dst_site [get_sites -of_objects $dst_bel]
+                    if $verbose {
+                        puts "  Dest: $dst_pin at site $dst_site:$dst_bel"
+                    }
+
+                    set dst_site_pins [get_site_pins -of_objects $dst_pin]
+                    # Some nets are internal
+                    # But should this happen on dest if we've already filtered source?
+ if {"$dst_site_pins" eq ""} { + continue + } + # Also apparantly you can have multiple of these as well + foreach dst_site_pin $dst_site_pins { + set fast_max [get_property "FAST_MAX" $delay] + set fast_min [get_property "FAST_MIN" $delay] + set slow_max [get_property "SLOW_MAX" $delay] + set slow_min [get_property "SLOW_MIN" $delay] + + # Want: + # Site / BEL at src + # Site / BEL at dst + # Pips in between + # Walk net, looking for interesting elements in between + set pips [get_pips -of_objects $net -from $src_site_pin -to $dst_site_pin] + if $verbose { + foreach pip $pips { + puts " PIP $pip" + } + } + set nodes [get_nodes -of_objects $net -from $src_site_pin -to $dst_site_pin] + #set wires [get_wires -of_objects $net -from $src_site_pin -to $dst_site_pin] + set wires [get_wires -of_objects $nodes] + + # puts $fp "$net $src_bel $dst_bel $ico $fast_max $fast_min $slow_max $slow_min $pips" + puts -nonewline $fp "$net $src_bel $dst_bel $ico $fast_max $fast_min $slow_max $slow_min" + + # Write pips w/ speed index + puts -nonewline $fp " " + set needspace 0 + foreach pip $pips { + if $needspace { + puts -nonewline $fp "|" + } + set speed_index [get_property SPEED_INDEX $pip] + puts -nonewline $fp "$pip:$speed_index" + set needspace 1 + } + + # Write nodes + #set nodes_str [string map {" " "|"} $nodes] + #puts -nonewline $fp " $nodes_str" + puts -nonewline $fp " " + set needspace 0 + foreach node $nodes { + if $needspace { + puts -nonewline $fp "|" + } + set nwires [llength [get_wires -of_objects $node]] + puts -nonewline $fp "$node:$nwires" + set needspace 1 + } + + # Write wires + puts -nonewline $fp " " + set needspace 0 + foreach wire $wires { + if $needspace { + puts -nonewline $fp "|" + } + set speed_index [get_property SPEED_INDEX $wire] + puts -nonewline $fp "$wire:$speed_index" + set needspace 1 + } + + puts $fp "" + + incr equations + break + } + } + } + } + } + close $fp + set TIME_taken [expr [clock clicks -milliseconds] - $TIME_start] + puts "Took ms: $TIME_taken" + puts "Generated $equations equations" + puts "Skipped $site_src_nets (+ $site_dst_nets) site nets" +} + +proc pips_all {} { + set outdir "." + set fp [open "$outdir/pip_all.txt" w] + set items [get_pips] + puts "Items: [llength $items]" + + set needspace 0 + set properties [list_property [lindex $items 0]] + foreach item $items { + set needspace 0 + foreach property $properties { + set val [get_property $property $item] + if {"$val" ne ""} { + if $needspace { + puts -nonewline $fp " " + } + puts -nonewline $fp "$property:$val" + set needspace 1 + } + } + puts $fp "" + } + close $fp +} +proc wires_all {} { + set outdir "." 
+ set fp [open "$outdir/wire_all.txt" w] + set items [get_wires] + puts "Items: [llength $items]" + + set needspace 0 + set properties [list_property [lindex $items 0]] + foreach item $items { + set needspace 0 + foreach property $properties { + set val [get_property $property $item] + if {"$val" ne ""} { + if $needspace { + puts -nonewline $fp " " + } + puts -nonewline $fp "$property:$val" + set needspace 1 + } + } + puts $fp "" + } + close $fp +} + +build_design +#write_info2 +write_info3 +#wires_all +#pips_all + diff --git a/experiments/timfuz/node_unique.py b/experiments/timfuz/node_unique.py new file mode 100644 index 00000000..e5793e64 --- /dev/null +++ b/experiments/timfuz/node_unique.py @@ -0,0 +1,99 @@ +''' +Verifies that node timing info is unique +''' + +import re + +def gen_nodes(fin): + for l in fin: + lj = {} + l = l.strip() + for kvs in l.split(): + name, value = kvs.split(':') + ''' + NAME:LIOB33_SING_X0Y199/IOB_IBUF0 + + IS_BAD:0 + IS_COMPLETE:1 + IS_GND:0 IS_INPUT_PIN:1 IS_OUTPUT_PIN:0 IS_PIN:1 IS_VCC:0 + NUM_WIRES:2 + PIN_WIRE:1 + ''' + if name in ('COST_CODE', 'SPEED_CLASS'): + value = int(value) + lj[name] = value + + tile_type, xy, wname = re.match(r'(.*)_(X[0-9]*Y[0-9]*)/(.*)', lj['NAME']).groups() + lj['tile_type'] = tile_type + lj['xy'] = xy + lj['wname'] = wname + + lj['l'] = l + + yield lj + +def run(node_fin, verbose=0): + refnodes = {} + nodei = 0 + for nodei, anode in enumerate(gen_nodes(node_fin)): + def getk(anode): + return anode['wname'] + #return (anode['tile_type'], anode['wname']) + + if nodei % 1000 == 0: + print 'Check node %d' % nodei + # Existing node? + try: + refnode = refnodes[getk(anode)] + except KeyError: + # Set as reference + refnodes[getk(anode)] = anode + continue + # Verify equivilence + for k in ( + 'SPEED_CLASS', + + 'COST_CODE', 'COST_CODE_NAME', + 'IS_BAD', 'IS_COMPLETE', 'IS_GND', 'IS_VCC', + ): + if k in refnode and k in anode: + def fail(): + print 'Mismatch on %s' % k + print refnode[k], anode[k] + print refnode['l'] + print anode['l'] + #assert 0 + if k == 'SPEED_CLASS': + # Parameters known to effect SPEED_CLASS + # Verify at least one parameter is different + if refnode[k] != anode[k]: + for k2 in ('IS_PIN', 'IS_INPUT_PIN', 'IS_OUTPUT_PIN', 'PIN_WIRE', 'NUM_WIRES'): + if refnode[k2] != anode[k2]: + break + else: + if 0: + print + fail() + elif refnode[k] != anode[k]: + print + fail() + # A key in one but not the other? 
+ elif k in refnode or k in anode: + assert 0 + +if __name__ == '__main__': + import argparse + + parser = argparse.ArgumentParser( + description= + 'Timing fuzzer' + ) + + parser.add_argument('--verbose', type=int, help='') + parser.add_argument( + 'node_fn_in', + default='/dev/stdin', + nargs='?', + help='Input file') + args = parser.parse_args() + run(open(args.node_fn_in, 'r'), verbose=args.verbose) diff --git a/experiments/timfuz/oneblinkw.v b/experiments/timfuz/oneblinkw.v new file mode 100644 index 00000000..5e133bac --- /dev/null +++ b/experiments/timfuz/oneblinkw.v @@ -0,0 +1,37 @@ +module roi ( + input wire clk, + output wire out); + reg [23:0] counter; + assign out = counter[23] ^ counter[22] ^ counter[2] && counter[1] || counter[0]; + + always @(posedge clk) begin + counter <= counter + 1; + end +endmodule + +module top(input wire clk, input wire stb, input wire di, output wire do); + localparam integer DIN_N = 0; + localparam integer DOUT_N = 1; + + reg [DIN_N-1:0] din; + wire [DOUT_N-1:0] dout; + + reg [DIN_N-1:0] din_shr; + reg [DOUT_N-1:0] dout_shr; + + always @(posedge clk) begin + din_shr <= {din_shr, di}; + dout_shr <= {dout_shr, din_shr[DIN_N-1]}; + if (stb) begin + din <= din_shr; + dout_shr <= dout; + end + end + + assign do = dout_shr[DOUT_N-1]; + roi roi( + .clk(clk), + .out(dout[0]) + ); +endmodule + diff --git a/experiments/timfuz/picorv32.v b/experiments/timfuz/picorv32.v new file mode 100644 index 00000000..af634b47 --- /dev/null +++ b/experiments/timfuz/picorv32.v @@ -0,0 +1,2977 @@ +/* + * PicoRV32 -- A Small RISC-V (RV32I) Processor Core + * + * Copyright (C) 2015 Clifford Wolf + * + * Permission to use, copy, modify, and/or distribute this software for any + * purpose with or without fee is hereby granted, provided that the above + * copyright notice and this permission notice appear in all copies. + * + * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES + * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF + * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR + * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES + * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN + * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF + * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. + * + */ + +`timescale 1 ns / 1 ps +// `default_nettype none +// `define DEBUGNETS +// `define DEBUGREGS +// `define DEBUGASM +// `define DEBUG + +`ifdef DEBUG + `define debug(debug_command) debug_command +`else + `define debug(debug_command) +`endif + +`ifdef FORMAL + `define FORMAL_KEEP (* keep *) + `define assert(assert_expr) assert(assert_expr) +`else + `ifdef DEBUGNETS + `define FORMAL_KEEP (* keep *) + `else + `define FORMAL_KEEP + `endif + `define assert(assert_expr) empty_statement +`endif + +// uncomment this for register file in extra module +// `define PICORV32_REGS picorv32_regs + +// this macro can be used to check if the verilog files in your +// design are read in the correct order. 
+`define PICORV32_V + + +/*************************************************************** + * picorv32 + ***************************************************************/ + +module picorv32 #( + parameter [ 0:0] ENABLE_COUNTERS = 1, + parameter [ 0:0] ENABLE_COUNTERS64 = 1, + parameter [ 0:0] ENABLE_REGS_16_31 = 1, + parameter [ 0:0] ENABLE_REGS_DUALPORT = 1, + parameter [ 0:0] LATCHED_MEM_RDATA = 0, + parameter [ 0:0] TWO_STAGE_SHIFT = 1, + parameter [ 0:0] BARREL_SHIFTER = 0, + parameter [ 0:0] TWO_CYCLE_COMPARE = 0, + parameter [ 0:0] TWO_CYCLE_ALU = 0, + parameter [ 0:0] COMPRESSED_ISA = 0, + parameter [ 0:0] CATCH_MISALIGN = 1, + parameter [ 0:0] CATCH_ILLINSN = 1, + parameter [ 0:0] ENABLE_PCPI = 0, + parameter [ 0:0] ENABLE_MUL = 0, + parameter [ 0:0] ENABLE_FAST_MUL = 0, + parameter [ 0:0] ENABLE_DIV = 0, + parameter [ 0:0] ENABLE_IRQ = 0, + parameter [ 0:0] ENABLE_IRQ_QREGS = 1, + parameter [ 0:0] ENABLE_IRQ_TIMER = 1, + parameter [ 0:0] ENABLE_TRACE = 0, + parameter [ 0:0] REGS_INIT_ZERO = 0, + parameter [31:0] MASKED_IRQ = 32'h 0000_0000, + parameter [31:0] LATCHED_IRQ = 32'h ffff_ffff, + parameter [31:0] PROGADDR_RESET = 32'h 0000_0000, + parameter [31:0] PROGADDR_IRQ = 32'h 0000_0010, + parameter [31:0] STACKADDR = 32'h ffff_ffff +) ( + input clk, resetn, + output reg trap, + + output reg mem_valid, + output reg mem_instr, + input mem_ready, + + output reg [31:0] mem_addr, + output reg [31:0] mem_wdata, + output reg [ 3:0] mem_wstrb, + input [31:0] mem_rdata, + + // Look-Ahead Interface + output mem_la_read, + output mem_la_write, + output [31:0] mem_la_addr, + output reg [31:0] mem_la_wdata, + output reg [ 3:0] mem_la_wstrb, + + // Pico Co-Processor Interface (PCPI) + output reg pcpi_valid, + output reg [31:0] pcpi_insn, + output [31:0] pcpi_rs1, + output [31:0] pcpi_rs2, + input pcpi_wr, + input [31:0] pcpi_rd, + input pcpi_wait, + input pcpi_ready, + + // IRQ Interface + input [31:0] irq, + output reg [31:0] eoi, + +`ifdef RISCV_FORMAL + output reg rvfi_valid, + output reg [63:0] rvfi_order, + output reg [31:0] rvfi_insn, + output reg rvfi_trap, + output reg rvfi_halt, + output reg rvfi_intr, + output reg [ 4:0] rvfi_rs1_addr, + output reg [ 4:0] rvfi_rs2_addr, + output reg [31:0] rvfi_rs1_rdata, + output reg [31:0] rvfi_rs2_rdata, + output reg [ 4:0] rvfi_rd_addr, + output reg [31:0] rvfi_rd_wdata, + output reg [31:0] rvfi_pc_rdata, + output reg [31:0] rvfi_pc_wdata, + output reg [31:0] rvfi_mem_addr, + output reg [ 3:0] rvfi_mem_rmask, + output reg [ 3:0] rvfi_mem_wmask, + output reg [31:0] rvfi_mem_rdata, + output reg [31:0] rvfi_mem_wdata, +`endif + + // Trace Interface + output reg trace_valid, + output reg [35:0] trace_data +); + localparam integer irq_timer = 0; + localparam integer irq_ebreak = 1; + localparam integer irq_buserror = 2; + + localparam integer irqregs_offset = ENABLE_REGS_16_31 ? 32 : 16; + localparam integer regfile_size = (ENABLE_REGS_16_31 ? 32 : 16) + 4*ENABLE_IRQ*ENABLE_IRQ_QREGS; + localparam integer regindex_bits = (ENABLE_REGS_16_31 ? 
5 : 4) + ENABLE_IRQ*ENABLE_IRQ_QREGS; + + localparam WITH_PCPI = ENABLE_PCPI || ENABLE_MUL || ENABLE_FAST_MUL || ENABLE_DIV; + + localparam [35:0] TRACE_BRANCH = {4'b 0001, 32'b 0}; + localparam [35:0] TRACE_ADDR = {4'b 0010, 32'b 0}; + localparam [35:0] TRACE_IRQ = {4'b 1000, 32'b 0}; + + reg [63:0] count_cycle, count_instr; + reg [31:0] reg_pc, reg_next_pc, reg_op1, reg_op2, reg_out; + reg [4:0] reg_sh; + + reg [31:0] next_insn_opcode; + reg [31:0] dbg_insn_opcode; + reg [31:0] dbg_insn_addr; + + wire dbg_mem_valid = mem_valid; + wire dbg_mem_instr = mem_instr; + wire dbg_mem_ready = mem_ready; + wire [31:0] dbg_mem_addr = mem_addr; + wire [31:0] dbg_mem_wdata = mem_wdata; + wire [ 3:0] dbg_mem_wstrb = mem_wstrb; + wire [31:0] dbg_mem_rdata = mem_rdata; + + assign pcpi_rs1 = reg_op1; + assign pcpi_rs2 = reg_op2; + + wire [31:0] next_pc; + + reg irq_delay; + reg irq_active; + reg [31:0] irq_mask; + reg [31:0] irq_pending; + reg [31:0] timer; + +`ifndef PICORV32_REGS + reg [31:0] cpuregs [0:regfile_size-1]; + + integer i; + initial begin + if (REGS_INIT_ZERO) begin + for (i = 0; i < regfile_size; i = i+1) + cpuregs[i] = 0; + end + end +`endif + + task empty_statement; + // This task is used by the `assert directive in non-formal mode to + // avoid empty statement (which are unsupported by plain Verilog syntax). + begin end + endtask + +`ifdef DEBUGREGS + wire [31:0] dbg_reg_x0 = 0; + wire [31:0] dbg_reg_x1 = cpuregs[1]; + wire [31:0] dbg_reg_x2 = cpuregs[2]; + wire [31:0] dbg_reg_x3 = cpuregs[3]; + wire [31:0] dbg_reg_x4 = cpuregs[4]; + wire [31:0] dbg_reg_x5 = cpuregs[5]; + wire [31:0] dbg_reg_x6 = cpuregs[6]; + wire [31:0] dbg_reg_x7 = cpuregs[7]; + wire [31:0] dbg_reg_x8 = cpuregs[8]; + wire [31:0] dbg_reg_x9 = cpuregs[9]; + wire [31:0] dbg_reg_x10 = cpuregs[10]; + wire [31:0] dbg_reg_x11 = cpuregs[11]; + wire [31:0] dbg_reg_x12 = cpuregs[12]; + wire [31:0] dbg_reg_x13 = cpuregs[13]; + wire [31:0] dbg_reg_x14 = cpuregs[14]; + wire [31:0] dbg_reg_x15 = cpuregs[15]; + wire [31:0] dbg_reg_x16 = cpuregs[16]; + wire [31:0] dbg_reg_x17 = cpuregs[17]; + wire [31:0] dbg_reg_x18 = cpuregs[18]; + wire [31:0] dbg_reg_x19 = cpuregs[19]; + wire [31:0] dbg_reg_x20 = cpuregs[20]; + wire [31:0] dbg_reg_x21 = cpuregs[21]; + wire [31:0] dbg_reg_x22 = cpuregs[22]; + wire [31:0] dbg_reg_x23 = cpuregs[23]; + wire [31:0] dbg_reg_x24 = cpuregs[24]; + wire [31:0] dbg_reg_x25 = cpuregs[25]; + wire [31:0] dbg_reg_x26 = cpuregs[26]; + wire [31:0] dbg_reg_x27 = cpuregs[27]; + wire [31:0] dbg_reg_x28 = cpuregs[28]; + wire [31:0] dbg_reg_x29 = cpuregs[29]; + wire [31:0] dbg_reg_x30 = cpuregs[30]; + wire [31:0] dbg_reg_x31 = cpuregs[31]; +`endif + + // Internal PCPI Cores + + wire pcpi_mul_wr; + wire [31:0] pcpi_mul_rd; + wire pcpi_mul_wait; + wire pcpi_mul_ready; + + wire pcpi_div_wr; + wire [31:0] pcpi_div_rd; + wire pcpi_div_wait; + wire pcpi_div_ready; + + reg pcpi_int_wr; + reg [31:0] pcpi_int_rd; + reg pcpi_int_wait; + reg pcpi_int_ready; + + generate if (ENABLE_FAST_MUL) begin + picorv32_pcpi_fast_mul pcpi_mul ( + .clk (clk ), + .resetn (resetn ), + .pcpi_valid(pcpi_valid ), + .pcpi_insn (pcpi_insn ), + .pcpi_rs1 (pcpi_rs1 ), + .pcpi_rs2 (pcpi_rs2 ), + .pcpi_wr (pcpi_mul_wr ), + .pcpi_rd (pcpi_mul_rd ), + .pcpi_wait (pcpi_mul_wait ), + .pcpi_ready(pcpi_mul_ready ) + ); + end else if (ENABLE_MUL) begin + picorv32_pcpi_mul pcpi_mul ( + .clk (clk ), + .resetn (resetn ), + .pcpi_valid(pcpi_valid ), + .pcpi_insn (pcpi_insn ), + .pcpi_rs1 (pcpi_rs1 ), + .pcpi_rs2 (pcpi_rs2 ), + .pcpi_wr (pcpi_mul_wr ), + .pcpi_rd 
(pcpi_mul_rd ), + .pcpi_wait (pcpi_mul_wait ), + .pcpi_ready(pcpi_mul_ready ) + ); + end else begin + assign pcpi_mul_wr = 0; + assign pcpi_mul_rd = 32'bx; + assign pcpi_mul_wait = 0; + assign pcpi_mul_ready = 0; + end endgenerate + + generate if (ENABLE_DIV) begin + picorv32_pcpi_div pcpi_div ( + .clk (clk ), + .resetn (resetn ), + .pcpi_valid(pcpi_valid ), + .pcpi_insn (pcpi_insn ), + .pcpi_rs1 (pcpi_rs1 ), + .pcpi_rs2 (pcpi_rs2 ), + .pcpi_wr (pcpi_div_wr ), + .pcpi_rd (pcpi_div_rd ), + .pcpi_wait (pcpi_div_wait ), + .pcpi_ready(pcpi_div_ready ) + ); + end else begin + assign pcpi_div_wr = 0; + assign pcpi_div_rd = 32'bx; + assign pcpi_div_wait = 0; + assign pcpi_div_ready = 0; + end endgenerate + + always @* begin + pcpi_int_wr = 0; + pcpi_int_rd = 32'bx; + pcpi_int_wait = |{ENABLE_PCPI && pcpi_wait, (ENABLE_MUL || ENABLE_FAST_MUL) && pcpi_mul_wait, ENABLE_DIV && pcpi_div_wait}; + pcpi_int_ready = |{ENABLE_PCPI && pcpi_ready, (ENABLE_MUL || ENABLE_FAST_MUL) && pcpi_mul_ready, ENABLE_DIV && pcpi_div_ready}; + + (* parallel_case *) + case (1'b1) + ENABLE_PCPI && pcpi_ready: begin + pcpi_int_wr = ENABLE_PCPI ? pcpi_wr : 0; + pcpi_int_rd = ENABLE_PCPI ? pcpi_rd : 0; + end + (ENABLE_MUL || ENABLE_FAST_MUL) && pcpi_mul_ready: begin + pcpi_int_wr = pcpi_mul_wr; + pcpi_int_rd = pcpi_mul_rd; + end + ENABLE_DIV && pcpi_div_ready: begin + pcpi_int_wr = pcpi_div_wr; + pcpi_int_rd = pcpi_div_rd; + end + endcase + end + + + // Memory Interface + + reg [1:0] mem_state; + reg [1:0] mem_wordsize; + reg [31:0] mem_rdata_word; + reg [31:0] mem_rdata_q; + reg mem_do_prefetch; + reg mem_do_rinst; + reg mem_do_rdata; + reg mem_do_wdata; + + wire mem_xfer; + reg mem_la_secondword, mem_la_firstword_reg, last_mem_valid; + wire mem_la_firstword = COMPRESSED_ISA && (mem_do_prefetch || mem_do_rinst) && next_pc[1] && !mem_la_secondword; + wire mem_la_firstword_xfer = COMPRESSED_ISA && mem_xfer && (!last_mem_valid ? mem_la_firstword : mem_la_firstword_reg); + + reg prefetched_high_word; + reg clear_prefetched_high_word; + reg [15:0] mem_16bit_buffer; + + wire [31:0] mem_rdata_latched_noshuffle; + wire [31:0] mem_rdata_latched; + + wire mem_la_use_prefetched_high_word = COMPRESSED_ISA && mem_la_firstword && prefetched_high_word && !clear_prefetched_high_word; + assign mem_xfer = (mem_valid && mem_ready) || (mem_la_use_prefetched_high_word && mem_do_rinst); + + wire mem_busy = |{mem_do_prefetch, mem_do_rinst, mem_do_rdata, mem_do_wdata}; + wire mem_done = resetn && ((mem_xfer && |mem_state && (mem_do_rinst || mem_do_rdata || mem_do_wdata)) || (&mem_state && mem_do_rinst)) && + (!mem_la_firstword || (~&mem_rdata_latched[1:0] && mem_xfer)); + + assign mem_la_write = resetn && !mem_state && mem_do_wdata; + assign mem_la_read = resetn && ((!mem_la_use_prefetched_high_word && !mem_state && (mem_do_rinst || mem_do_prefetch || mem_do_rdata)) || + (COMPRESSED_ISA && mem_xfer && (!last_mem_valid ? mem_la_firstword : mem_la_firstword_reg) && !mem_la_secondword && &mem_rdata_latched[1:0])); + assign mem_la_addr = (mem_do_prefetch || mem_do_rinst) ? {next_pc[31:2] + mem_la_firstword_xfer, 2'b00} : {reg_op1[31:2], 2'b00}; + + assign mem_rdata_latched_noshuffle = (mem_xfer || LATCHED_MEM_RDATA) ? mem_rdata : mem_rdata_q; + + assign mem_rdata_latched = COMPRESSED_ISA && mem_la_use_prefetched_high_word ? {16'bx, mem_16bit_buffer} : + COMPRESSED_ISA && mem_la_secondword ? {mem_rdata_latched_noshuffle[15:0], mem_16bit_buffer} : + COMPRESSED_ISA && mem_la_firstword ? 
{16'bx, mem_rdata_latched_noshuffle[31:16]} : mem_rdata_latched_noshuffle; + + always @(posedge clk) begin + if (!resetn) begin + mem_la_firstword_reg <= 0; + last_mem_valid <= 0; + end else begin + if (!last_mem_valid) + mem_la_firstword_reg <= mem_la_firstword; + last_mem_valid <= mem_valid && !mem_ready; + end + end + + always @* begin + (* full_case *) + case (mem_wordsize) + 0: begin + mem_la_wdata = reg_op2; + mem_la_wstrb = 4'b1111; + mem_rdata_word = mem_rdata; + end + 1: begin + mem_la_wdata = {2{reg_op2[15:0]}}; + mem_la_wstrb = reg_op1[1] ? 4'b1100 : 4'b0011; + case (reg_op1[1]) + 1'b0: mem_rdata_word = {16'b0, mem_rdata[15: 0]}; + 1'b1: mem_rdata_word = {16'b0, mem_rdata[31:16]}; + endcase + end + 2: begin + mem_la_wdata = {4{reg_op2[7:0]}}; + mem_la_wstrb = 4'b0001 << reg_op1[1:0]; + case (reg_op1[1:0]) + 2'b00: mem_rdata_word = {24'b0, mem_rdata[ 7: 0]}; + 2'b01: mem_rdata_word = {24'b0, mem_rdata[15: 8]}; + 2'b10: mem_rdata_word = {24'b0, mem_rdata[23:16]}; + 2'b11: mem_rdata_word = {24'b0, mem_rdata[31:24]}; + endcase + end + endcase + end + + always @(posedge clk) begin + if (mem_xfer) begin + mem_rdata_q <= COMPRESSED_ISA ? mem_rdata_latched : mem_rdata; + next_insn_opcode <= COMPRESSED_ISA ? mem_rdata_latched : mem_rdata; + end + + if (COMPRESSED_ISA && mem_done && (mem_do_prefetch || mem_do_rinst)) begin + case (mem_rdata_latched[1:0]) + 2'b00: begin // Quadrant 0 + case (mem_rdata_latched[15:13]) + 3'b000: begin // C.ADDI4SPN + mem_rdata_q[14:12] <= 3'b000; + mem_rdata_q[31:20] <= {2'b0, mem_rdata_latched[10:7], mem_rdata_latched[12:11], mem_rdata_latched[5], mem_rdata_latched[6], 2'b00}; + end + 3'b010: begin // C.LW + mem_rdata_q[31:20] <= {5'b0, mem_rdata_latched[5], mem_rdata_latched[12:10], mem_rdata_latched[6], 2'b00}; + mem_rdata_q[14:12] <= 3'b 010; + end + 3'b 110: begin // C.SW + {mem_rdata_q[31:25], mem_rdata_q[11:7]} <= {5'b0, mem_rdata_latched[5], mem_rdata_latched[12:10], mem_rdata_latched[6], 2'b00}; + mem_rdata_q[14:12] <= 3'b 010; + end + endcase + end + 2'b01: begin // Quadrant 1 + case (mem_rdata_latched[15:13]) + 3'b 000: begin // C.ADDI + mem_rdata_q[14:12] <= 3'b000; + mem_rdata_q[31:20] <= $signed({mem_rdata_latched[12], mem_rdata_latched[6:2]}); + end + 3'b 010: begin // C.LI + mem_rdata_q[14:12] <= 3'b000; + mem_rdata_q[31:20] <= $signed({mem_rdata_latched[12], mem_rdata_latched[6:2]}); + end + 3'b 011: begin + if (mem_rdata_latched[11:7] == 2) begin // C.ADDI16SP + mem_rdata_q[14:12] <= 3'b000; + mem_rdata_q[31:20] <= $signed({mem_rdata_latched[12], mem_rdata_latched[4:3], + mem_rdata_latched[5], mem_rdata_latched[2], mem_rdata_latched[6], 4'b 0000}); + end else begin // C.LUI + mem_rdata_q[31:12] <= $signed({mem_rdata_latched[12], mem_rdata_latched[6:2]}); + end + end + 3'b100: begin + if (mem_rdata_latched[11:10] == 2'b00) begin // C.SRLI + mem_rdata_q[31:25] <= 7'b0000000; + mem_rdata_q[14:12] <= 3'b 101; + end + if (mem_rdata_latched[11:10] == 2'b01) begin // C.SRAI + mem_rdata_q[31:25] <= 7'b0100000; + mem_rdata_q[14:12] <= 3'b 101; + end + if (mem_rdata_latched[11:10] == 2'b10) begin // C.ANDI + mem_rdata_q[14:12] <= 3'b111; + mem_rdata_q[31:20] <= $signed({mem_rdata_latched[12], mem_rdata_latched[6:2]}); + end + if (mem_rdata_latched[12:10] == 3'b011) begin // C.SUB, C.XOR, C.OR, C.AND + if (mem_rdata_latched[6:5] == 2'b00) mem_rdata_q[14:12] <= 3'b000; + if (mem_rdata_latched[6:5] == 2'b01) mem_rdata_q[14:12] <= 3'b100; + if (mem_rdata_latched[6:5] == 2'b10) mem_rdata_q[14:12] <= 3'b110; + if (mem_rdata_latched[6:5] == 2'b11) 
mem_rdata_q[14:12] <= 3'b111; + mem_rdata_q[31:25] <= mem_rdata_latched[6:5] == 2'b00 ? 7'b0100000 : 7'b0000000; + end + end + 3'b 110: begin // C.BEQZ + mem_rdata_q[14:12] <= 3'b000; + { mem_rdata_q[31], mem_rdata_q[7], mem_rdata_q[30:25], mem_rdata_q[11:8] } <= + $signed({mem_rdata_latched[12], mem_rdata_latched[6:5], mem_rdata_latched[2], + mem_rdata_latched[11:10], mem_rdata_latched[4:3]}); + end + 3'b 111: begin // C.BNEZ + mem_rdata_q[14:12] <= 3'b001; + { mem_rdata_q[31], mem_rdata_q[7], mem_rdata_q[30:25], mem_rdata_q[11:8] } <= + $signed({mem_rdata_latched[12], mem_rdata_latched[6:5], mem_rdata_latched[2], + mem_rdata_latched[11:10], mem_rdata_latched[4:3]}); + end + endcase + end + 2'b10: begin // Quadrant 2 + case (mem_rdata_latched[15:13]) + 3'b000: begin // C.SLLI + mem_rdata_q[31:25] <= 7'b0000000; + mem_rdata_q[14:12] <= 3'b 001; + end + 3'b010: begin // C.LWSP + mem_rdata_q[31:20] <= {4'b0, mem_rdata_latched[3:2], mem_rdata_latched[12], mem_rdata_latched[6:4], 2'b00}; + mem_rdata_q[14:12] <= 3'b 010; + end + 3'b100: begin + if (mem_rdata_latched[12] == 0 && mem_rdata_latched[6:2] == 0) begin // C.JR + mem_rdata_q[14:12] <= 3'b000; + mem_rdata_q[31:20] <= 12'b0; + end + if (mem_rdata_latched[12] == 0 && mem_rdata_latched[6:2] != 0) begin // C.MV + mem_rdata_q[14:12] <= 3'b000; + mem_rdata_q[31:25] <= 7'b0000000; + end + if (mem_rdata_latched[12] != 0 && mem_rdata_latched[11:7] != 0 && mem_rdata_latched[6:2] == 0) begin // C.JALR + mem_rdata_q[14:12] <= 3'b000; + mem_rdata_q[31:20] <= 12'b0; + end + if (mem_rdata_latched[12] != 0 && mem_rdata_latched[6:2] != 0) begin // C.ADD + mem_rdata_q[14:12] <= 3'b000; + mem_rdata_q[31:25] <= 7'b0000000; + end + end + 3'b110: begin // C.SWSP + {mem_rdata_q[31:25], mem_rdata_q[11:7]} <= {4'b0, mem_rdata_latched[8:7], mem_rdata_latched[12:9], 2'b00}; + mem_rdata_q[14:12] <= 3'b 010; + end + endcase + end + endcase + end + end + + always @(posedge clk) begin + if (resetn && !trap) begin + if (mem_do_prefetch || mem_do_rinst || mem_do_rdata) + `assert(!mem_do_wdata); + + if (mem_do_prefetch || mem_do_rinst) + `assert(!mem_do_rdata); + + if (mem_do_rdata) + `assert(!mem_do_prefetch && !mem_do_rinst); + + if (mem_do_wdata) + `assert(!(mem_do_prefetch || mem_do_rinst || mem_do_rdata)); + + if (mem_state == 2 || mem_state == 3) + `assert(mem_valid || mem_do_prefetch); + end + end + + always @(posedge clk) begin + if (!resetn || trap) begin + if (!resetn) + mem_state <= 0; + if (!resetn || mem_ready) + mem_valid <= 0; + mem_la_secondword <= 0; + prefetched_high_word <= 0; + end else begin + if (mem_la_read || mem_la_write) begin + mem_addr <= mem_la_addr; + mem_wstrb <= mem_la_wstrb & {4{mem_la_write}}; + end + if (mem_la_write) begin + mem_wdata <= mem_la_wdata; + end + case (mem_state) + 0: begin + if (mem_do_prefetch || mem_do_rinst || mem_do_rdata) begin + mem_valid <= !mem_la_use_prefetched_high_word; + mem_instr <= mem_do_prefetch || mem_do_rinst; + mem_wstrb <= 0; + mem_state <= 1; + end + if (mem_do_wdata) begin + mem_valid <= 1; + mem_instr <= 0; + mem_state <= 2; + end + end + 1: begin + `assert(mem_wstrb == 0); + `assert(mem_do_prefetch || mem_do_rinst || mem_do_rdata); + `assert(mem_valid == !mem_la_use_prefetched_high_word); + `assert(mem_instr == (mem_do_prefetch || mem_do_rinst)); + if (mem_xfer) begin + if (COMPRESSED_ISA && mem_la_read) begin + mem_valid <= 1; + mem_la_secondword <= 1; + if (!mem_la_use_prefetched_high_word) + mem_16bit_buffer <= mem_rdata[31:16]; + end else begin + mem_valid <= 0; + mem_la_secondword <= 0; + if 
(COMPRESSED_ISA && !mem_do_rdata) begin + if (~&mem_rdata[1:0] || mem_la_secondword) begin + mem_16bit_buffer <= mem_rdata[31:16]; + prefetched_high_word <= 1; + end else begin + prefetched_high_word <= 0; + end + end + mem_state <= mem_do_rinst || mem_do_rdata ? 0 : 3; + end + end + end + 2: begin + `assert(mem_wstrb != 0); + `assert(mem_do_wdata); + if (mem_xfer) begin + mem_valid <= 0; + mem_state <= 0; + end + end + 3: begin + `assert(mem_wstrb == 0); + `assert(mem_do_prefetch); + if (mem_do_rinst) begin + mem_state <= 0; + end + end + endcase + end + + if (clear_prefetched_high_word) + prefetched_high_word <= 0; + end + + + // Instruction Decoder + + reg instr_lui, instr_auipc, instr_jal, instr_jalr; + reg instr_beq, instr_bne, instr_blt, instr_bge, instr_bltu, instr_bgeu; + reg instr_lb, instr_lh, instr_lw, instr_lbu, instr_lhu, instr_sb, instr_sh, instr_sw; + reg instr_addi, instr_slti, instr_sltiu, instr_xori, instr_ori, instr_andi, instr_slli, instr_srli, instr_srai; + reg instr_add, instr_sub, instr_sll, instr_slt, instr_sltu, instr_xor, instr_srl, instr_sra, instr_or, instr_and; + reg instr_rdcycle, instr_rdcycleh, instr_rdinstr, instr_rdinstrh, instr_ecall_ebreak; + reg instr_getq, instr_setq, instr_retirq, instr_maskirq, instr_waitirq, instr_timer; + wire instr_trap; + + reg [regindex_bits-1:0] decoded_rd, decoded_rs1, decoded_rs2; + reg [31:0] decoded_imm, decoded_imm_uj; + reg decoder_trigger; + reg decoder_trigger_q; + reg decoder_pseudo_trigger; + reg decoder_pseudo_trigger_q; + reg compressed_instr; + + reg is_lui_auipc_jal; + reg is_lb_lh_lw_lbu_lhu; + reg is_slli_srli_srai; + reg is_jalr_addi_slti_sltiu_xori_ori_andi; + reg is_sb_sh_sw; + reg is_sll_srl_sra; + reg is_lui_auipc_jal_jalr_addi_add_sub; + reg is_slti_blt_slt; + reg is_sltiu_bltu_sltu; + reg is_beq_bne_blt_bge_bltu_bgeu; + reg is_lbu_lhu_lw; + reg is_alu_reg_imm; + reg is_alu_reg_reg; + reg is_compare; + + assign instr_trap = (CATCH_ILLINSN || WITH_PCPI) && !{instr_lui, instr_auipc, instr_jal, instr_jalr, + instr_beq, instr_bne, instr_blt, instr_bge, instr_bltu, instr_bgeu, + instr_lb, instr_lh, instr_lw, instr_lbu, instr_lhu, instr_sb, instr_sh, instr_sw, + instr_addi, instr_slti, instr_sltiu, instr_xori, instr_ori, instr_andi, instr_slli, instr_srli, instr_srai, + instr_add, instr_sub, instr_sll, instr_slt, instr_sltu, instr_xor, instr_srl, instr_sra, instr_or, instr_and, + instr_rdcycle, instr_rdcycleh, instr_rdinstr, instr_rdinstrh, + instr_getq, instr_setq, instr_retirq, instr_maskirq, instr_waitirq, instr_timer}; + + wire is_rdcycle_rdcycleh_rdinstr_rdinstrh; + assign is_rdcycle_rdcycleh_rdinstr_rdinstrh = |{instr_rdcycle, instr_rdcycleh, instr_rdinstr, instr_rdinstrh}; + + reg [63:0] new_ascii_instr; + `FORMAL_KEEP reg [63:0] dbg_ascii_instr; + `FORMAL_KEEP reg [31:0] dbg_insn_imm; + `FORMAL_KEEP reg [4:0] dbg_insn_rs1; + `FORMAL_KEEP reg [4:0] dbg_insn_rs2; + `FORMAL_KEEP reg [4:0] dbg_insn_rd; + `FORMAL_KEEP reg [31:0] dbg_rs1val; + `FORMAL_KEEP reg [31:0] dbg_rs2val; + `FORMAL_KEEP reg dbg_rs1val_valid; + `FORMAL_KEEP reg dbg_rs2val_valid; + + always @* begin + new_ascii_instr = ""; + + if (instr_lui) new_ascii_instr = "lui"; + if (instr_auipc) new_ascii_instr = "auipc"; + if (instr_jal) new_ascii_instr = "jal"; + if (instr_jalr) new_ascii_instr = "jalr"; + + if (instr_beq) new_ascii_instr = "beq"; + if (instr_bne) new_ascii_instr = "bne"; + if (instr_blt) new_ascii_instr = "blt"; + if (instr_bge) new_ascii_instr = "bge"; + if (instr_bltu) new_ascii_instr = "bltu"; + if (instr_bgeu) new_ascii_instr 
= "bgeu"; + + if (instr_lb) new_ascii_instr = "lb"; + if (instr_lh) new_ascii_instr = "lh"; + if (instr_lw) new_ascii_instr = "lw"; + if (instr_lbu) new_ascii_instr = "lbu"; + if (instr_lhu) new_ascii_instr = "lhu"; + if (instr_sb) new_ascii_instr = "sb"; + if (instr_sh) new_ascii_instr = "sh"; + if (instr_sw) new_ascii_instr = "sw"; + + if (instr_addi) new_ascii_instr = "addi"; + if (instr_slti) new_ascii_instr = "slti"; + if (instr_sltiu) new_ascii_instr = "sltiu"; + if (instr_xori) new_ascii_instr = "xori"; + if (instr_ori) new_ascii_instr = "ori"; + if (instr_andi) new_ascii_instr = "andi"; + if (instr_slli) new_ascii_instr = "slli"; + if (instr_srli) new_ascii_instr = "srli"; + if (instr_srai) new_ascii_instr = "srai"; + + if (instr_add) new_ascii_instr = "add"; + if (instr_sub) new_ascii_instr = "sub"; + if (instr_sll) new_ascii_instr = "sll"; + if (instr_slt) new_ascii_instr = "slt"; + if (instr_sltu) new_ascii_instr = "sltu"; + if (instr_xor) new_ascii_instr = "xor"; + if (instr_srl) new_ascii_instr = "srl"; + if (instr_sra) new_ascii_instr = "sra"; + if (instr_or) new_ascii_instr = "or"; + if (instr_and) new_ascii_instr = "and"; + + if (instr_rdcycle) new_ascii_instr = "rdcycle"; + if (instr_rdcycleh) new_ascii_instr = "rdcycleh"; + if (instr_rdinstr) new_ascii_instr = "rdinstr"; + if (instr_rdinstrh) new_ascii_instr = "rdinstrh"; + + if (instr_getq) new_ascii_instr = "getq"; + if (instr_setq) new_ascii_instr = "setq"; + if (instr_retirq) new_ascii_instr = "retirq"; + if (instr_maskirq) new_ascii_instr = "maskirq"; + if (instr_waitirq) new_ascii_instr = "waitirq"; + if (instr_timer) new_ascii_instr = "timer"; + end + + reg [63:0] q_ascii_instr; + reg [31:0] q_insn_imm; + reg [31:0] q_insn_opcode; + reg [4:0] q_insn_rs1; + reg [4:0] q_insn_rs2; + reg [4:0] q_insn_rd; + reg dbg_next; + + wire launch_next_insn; + reg dbg_valid_insn; + + reg [63:0] cached_ascii_instr; + reg [31:0] cached_insn_imm; + reg [31:0] cached_insn_opcode; + reg [4:0] cached_insn_rs1; + reg [4:0] cached_insn_rs2; + reg [4:0] cached_insn_rd; + + always @(posedge clk) begin + q_ascii_instr <= dbg_ascii_instr; + q_insn_imm <= dbg_insn_imm; + q_insn_opcode <= dbg_insn_opcode; + q_insn_rs1 <= dbg_insn_rs1; + q_insn_rs2 <= dbg_insn_rs2; + q_insn_rd <= dbg_insn_rd; + dbg_next <= launch_next_insn; + + if (!resetn || trap) + dbg_valid_insn <= 0; + else if (launch_next_insn) + dbg_valid_insn <= 1; + + if (decoder_trigger_q) begin + cached_ascii_instr <= new_ascii_instr; + cached_insn_imm <= decoded_imm; + if (&next_insn_opcode[1:0]) + cached_insn_opcode <= next_insn_opcode; + else + cached_insn_opcode <= {16'b0, next_insn_opcode[15:0]}; + cached_insn_rs1 <= decoded_rs1; + cached_insn_rs2 <= decoded_rs2; + cached_insn_rd <= decoded_rd; + end + + if (launch_next_insn) begin + dbg_insn_addr <= next_pc; + end + end + + always @* begin + dbg_ascii_instr = q_ascii_instr; + dbg_insn_imm = q_insn_imm; + dbg_insn_opcode = q_insn_opcode; + dbg_insn_rs1 = q_insn_rs1; + dbg_insn_rs2 = q_insn_rs2; + dbg_insn_rd = q_insn_rd; + + if (dbg_next) begin + if (decoder_pseudo_trigger_q) begin + dbg_ascii_instr = cached_ascii_instr; + dbg_insn_imm = cached_insn_imm; + dbg_insn_opcode = cached_insn_opcode; + dbg_insn_rs1 = cached_insn_rs1; + dbg_insn_rs2 = cached_insn_rs2; + dbg_insn_rd = cached_insn_rd; + end else begin + dbg_ascii_instr = new_ascii_instr; + if (&next_insn_opcode[1:0]) + dbg_insn_opcode = next_insn_opcode; + else + dbg_insn_opcode = {16'b0, next_insn_opcode[15:0]}; + dbg_insn_imm = decoded_imm; + dbg_insn_rs1 = decoded_rs1; + 
dbg_insn_rs2 = decoded_rs2; + dbg_insn_rd = decoded_rd; + end + end + end + +`ifdef DEBUGASM + always @(posedge clk) begin + if (dbg_next) begin + $display("debugasm %x %x %s", dbg_insn_addr, dbg_insn_opcode, dbg_ascii_instr ? dbg_ascii_instr : "*"); + end + end +`endif + +`ifdef DEBUG + always @(posedge clk) begin + if (dbg_next) begin + if (&dbg_insn_opcode[1:0]) + $display("DECODE: 0x%08x 0x%08x %-0s", dbg_insn_addr, dbg_insn_opcode, dbg_ascii_instr ? dbg_ascii_instr : "UNKNOWN"); + else + $display("DECODE: 0x%08x 0x%04x %-0s", dbg_insn_addr, dbg_insn_opcode[15:0], dbg_ascii_instr ? dbg_ascii_instr : "UNKNOWN"); + end + end +`endif + + always @(posedge clk) begin + is_lui_auipc_jal <= |{instr_lui, instr_auipc, instr_jal}; + is_lui_auipc_jal_jalr_addi_add_sub <= |{instr_lui, instr_auipc, instr_jal, instr_jalr, instr_addi, instr_add, instr_sub}; + is_slti_blt_slt <= |{instr_slti, instr_blt, instr_slt}; + is_sltiu_bltu_sltu <= |{instr_sltiu, instr_bltu, instr_sltu}; + is_lbu_lhu_lw <= |{instr_lbu, instr_lhu, instr_lw}; + is_compare <= |{is_beq_bne_blt_bge_bltu_bgeu, instr_slti, instr_slt, instr_sltiu, instr_sltu}; + + if (mem_do_rinst && mem_done) begin + instr_lui <= mem_rdata_latched[6:0] == 7'b0110111; + instr_auipc <= mem_rdata_latched[6:0] == 7'b0010111; + instr_jal <= mem_rdata_latched[6:0] == 7'b1101111; + instr_jalr <= mem_rdata_latched[6:0] == 7'b1100111 && mem_rdata_latched[14:12] == 3'b000; + instr_retirq <= mem_rdata_latched[6:0] == 7'b0001011 && mem_rdata_latched[31:25] == 7'b0000010 && ENABLE_IRQ; + instr_waitirq <= mem_rdata_latched[6:0] == 7'b0001011 && mem_rdata_latched[31:25] == 7'b0000100 && ENABLE_IRQ; + + is_beq_bne_blt_bge_bltu_bgeu <= mem_rdata_latched[6:0] == 7'b1100011; + is_lb_lh_lw_lbu_lhu <= mem_rdata_latched[6:0] == 7'b0000011; + is_sb_sh_sw <= mem_rdata_latched[6:0] == 7'b0100011; + is_alu_reg_imm <= mem_rdata_latched[6:0] == 7'b0010011; + is_alu_reg_reg <= mem_rdata_latched[6:0] == 7'b0110011; + + { decoded_imm_uj[31:20], decoded_imm_uj[10:1], decoded_imm_uj[11], decoded_imm_uj[19:12], decoded_imm_uj[0] } <= $signed({mem_rdata_latched[31:12], 1'b0}); + + decoded_rd <= mem_rdata_latched[11:7]; + decoded_rs1 <= mem_rdata_latched[19:15]; + decoded_rs2 <= mem_rdata_latched[24:20]; + + if (mem_rdata_latched[6:0] == 7'b0001011 && mem_rdata_latched[31:25] == 7'b0000000 && ENABLE_IRQ && ENABLE_IRQ_QREGS) + decoded_rs1[regindex_bits-1] <= 1; // instr_getq + + if (mem_rdata_latched[6:0] == 7'b0001011 && mem_rdata_latched[31:25] == 7'b0000010 && ENABLE_IRQ) + decoded_rs1 <= ENABLE_IRQ_QREGS ? 
irqregs_offset : 3; // instr_retirq + + compressed_instr <= 0; + if (COMPRESSED_ISA && mem_rdata_latched[1:0] != 2'b11) begin + compressed_instr <= 1; + decoded_rd <= 0; + decoded_rs1 <= 0; + decoded_rs2 <= 0; + + { decoded_imm_uj[31:11], decoded_imm_uj[4], decoded_imm_uj[9:8], decoded_imm_uj[10], decoded_imm_uj[6], + decoded_imm_uj[7], decoded_imm_uj[3:1], decoded_imm_uj[5], decoded_imm_uj[0] } <= $signed({mem_rdata_latched[12:2], 1'b0}); + + case (mem_rdata_latched[1:0]) + 2'b00: begin // Quadrant 0 + case (mem_rdata_latched[15:13]) + 3'b000: begin // C.ADDI4SPN + is_alu_reg_imm <= |mem_rdata_latched[12:5]; + decoded_rs1 <= 2; + decoded_rd <= 8 + mem_rdata_latched[4:2]; + end + 3'b010: begin // C.LW + is_lb_lh_lw_lbu_lhu <= 1; + decoded_rs1 <= 8 + mem_rdata_latched[9:7]; + decoded_rd <= 8 + mem_rdata_latched[4:2]; + end + 3'b110: begin // C.SW + is_sb_sh_sw <= 1; + decoded_rs1 <= 8 + mem_rdata_latched[9:7]; + decoded_rs2 <= 8 + mem_rdata_latched[4:2]; + end + endcase + end + 2'b01: begin // Quadrant 1 + case (mem_rdata_latched[15:13]) + 3'b000: begin // C.NOP / C.ADDI + is_alu_reg_imm <= 1; + decoded_rd <= mem_rdata_latched[11:7]; + decoded_rs1 <= mem_rdata_latched[11:7]; + end + 3'b001: begin // C.JAL + instr_jal <= 1; + decoded_rd <= 1; + end + 3'b 010: begin // C.LI + is_alu_reg_imm <= 1; + decoded_rd <= mem_rdata_latched[11:7]; + decoded_rs1 <= 0; + end + 3'b 011: begin + if (mem_rdata_latched[12] || mem_rdata_latched[6:2]) begin + if (mem_rdata_latched[11:7] == 2) begin // C.ADDI16SP + is_alu_reg_imm <= 1; + decoded_rd <= mem_rdata_latched[11:7]; + decoded_rs1 <= mem_rdata_latched[11:7]; + end else begin // C.LUI + instr_lui <= 1; + decoded_rd <= mem_rdata_latched[11:7]; + decoded_rs1 <= 0; + end + end + end + 3'b100: begin + if (!mem_rdata_latched[11] && !mem_rdata_latched[12]) begin // C.SRLI, C.SRAI + is_alu_reg_imm <= 1; + decoded_rd <= 8 + mem_rdata_latched[9:7]; + decoded_rs1 <= 8 + mem_rdata_latched[9:7]; + decoded_rs2 <= {mem_rdata_latched[12], mem_rdata_latched[6:2]}; + end + if (mem_rdata_latched[11:10] == 2'b10) begin // C.ANDI + is_alu_reg_imm <= 1; + decoded_rd <= 8 + mem_rdata_latched[9:7]; + decoded_rs1 <= 8 + mem_rdata_latched[9:7]; + end + if (mem_rdata_latched[12:10] == 3'b011) begin // C.SUB, C.XOR, C.OR, C.AND + is_alu_reg_reg <= 1; + decoded_rd <= 8 + mem_rdata_latched[9:7]; + decoded_rs1 <= 8 + mem_rdata_latched[9:7]; + decoded_rs2 <= 8 + mem_rdata_latched[4:2]; + end + end + 3'b101: begin // C.J + instr_jal <= 1; + end + 3'b110: begin // C.BEQZ + is_beq_bne_blt_bge_bltu_bgeu <= 1; + decoded_rs1 <= 8 + mem_rdata_latched[9:7]; + decoded_rs2 <= 0; + end + 3'b111: begin // C.BNEZ + is_beq_bne_blt_bge_bltu_bgeu <= 1; + decoded_rs1 <= 8 + mem_rdata_latched[9:7]; + decoded_rs2 <= 0; + end + endcase + end + 2'b10: begin // Quadrant 2 + case (mem_rdata_latched[15:13]) + 3'b000: begin // C.SLLI + if (!mem_rdata_latched[12]) begin + is_alu_reg_imm <= 1; + decoded_rd <= mem_rdata_latched[11:7]; + decoded_rs1 <= mem_rdata_latched[11:7]; + decoded_rs2 <= {mem_rdata_latched[12], mem_rdata_latched[6:2]}; + end + end + 3'b010: begin // C.LWSP + if (mem_rdata_latched[11:7]) begin + is_lb_lh_lw_lbu_lhu <= 1; + decoded_rd <= mem_rdata_latched[11:7]; + decoded_rs1 <= 2; + end + end + 3'b100: begin + if (mem_rdata_latched[12] == 0 && mem_rdata_latched[11:7] != 0 && mem_rdata_latched[6:2] == 0) begin // C.JR + instr_jalr <= 1; + decoded_rd <= 0; + decoded_rs1 <= mem_rdata_latched[11:7]; + end + if (mem_rdata_latched[12] == 0 && mem_rdata_latched[6:2] != 0) begin // C.MV + 
is_alu_reg_reg <= 1; + decoded_rd <= mem_rdata_latched[11:7]; + decoded_rs1 <= 0; + decoded_rs2 <= mem_rdata_latched[6:2]; + end + if (mem_rdata_latched[12] != 0 && mem_rdata_latched[11:7] != 0 && mem_rdata_latched[6:2] == 0) begin // C.JALR + instr_jalr <= 1; + decoded_rd <= 1; + decoded_rs1 <= mem_rdata_latched[11:7]; + end + if (mem_rdata_latched[12] != 0 && mem_rdata_latched[6:2] != 0) begin // C.ADD + is_alu_reg_reg <= 1; + decoded_rd <= mem_rdata_latched[11:7]; + decoded_rs1 <= mem_rdata_latched[11:7]; + decoded_rs2 <= mem_rdata_latched[6:2]; + end + end + 3'b110: begin // C.SWSP + is_sb_sh_sw <= 1; + decoded_rs1 <= 2; + decoded_rs2 <= mem_rdata_latched[6:2]; + end + endcase + end + endcase + end + end + + if (decoder_trigger && !decoder_pseudo_trigger) begin + pcpi_insn <= WITH_PCPI ? mem_rdata_q : 'bx; + + instr_beq <= is_beq_bne_blt_bge_bltu_bgeu && mem_rdata_q[14:12] == 3'b000; + instr_bne <= is_beq_bne_blt_bge_bltu_bgeu && mem_rdata_q[14:12] == 3'b001; + instr_blt <= is_beq_bne_blt_bge_bltu_bgeu && mem_rdata_q[14:12] == 3'b100; + instr_bge <= is_beq_bne_blt_bge_bltu_bgeu && mem_rdata_q[14:12] == 3'b101; + instr_bltu <= is_beq_bne_blt_bge_bltu_bgeu && mem_rdata_q[14:12] == 3'b110; + instr_bgeu <= is_beq_bne_blt_bge_bltu_bgeu && mem_rdata_q[14:12] == 3'b111; + + instr_lb <= is_lb_lh_lw_lbu_lhu && mem_rdata_q[14:12] == 3'b000; + instr_lh <= is_lb_lh_lw_lbu_lhu && mem_rdata_q[14:12] == 3'b001; + instr_lw <= is_lb_lh_lw_lbu_lhu && mem_rdata_q[14:12] == 3'b010; + instr_lbu <= is_lb_lh_lw_lbu_lhu && mem_rdata_q[14:12] == 3'b100; + instr_lhu <= is_lb_lh_lw_lbu_lhu && mem_rdata_q[14:12] == 3'b101; + + instr_sb <= is_sb_sh_sw && mem_rdata_q[14:12] == 3'b000; + instr_sh <= is_sb_sh_sw && mem_rdata_q[14:12] == 3'b001; + instr_sw <= is_sb_sh_sw && mem_rdata_q[14:12] == 3'b010; + + instr_addi <= is_alu_reg_imm && mem_rdata_q[14:12] == 3'b000; + instr_slti <= is_alu_reg_imm && mem_rdata_q[14:12] == 3'b010; + instr_sltiu <= is_alu_reg_imm && mem_rdata_q[14:12] == 3'b011; + instr_xori <= is_alu_reg_imm && mem_rdata_q[14:12] == 3'b100; + instr_ori <= is_alu_reg_imm && mem_rdata_q[14:12] == 3'b110; + instr_andi <= is_alu_reg_imm && mem_rdata_q[14:12] == 3'b111; + + instr_slli <= is_alu_reg_imm && mem_rdata_q[14:12] == 3'b001 && mem_rdata_q[31:25] == 7'b0000000; + instr_srli <= is_alu_reg_imm && mem_rdata_q[14:12] == 3'b101 && mem_rdata_q[31:25] == 7'b0000000; + instr_srai <= is_alu_reg_imm && mem_rdata_q[14:12] == 3'b101 && mem_rdata_q[31:25] == 7'b0100000; + + instr_add <= is_alu_reg_reg && mem_rdata_q[14:12] == 3'b000 && mem_rdata_q[31:25] == 7'b0000000; + instr_sub <= is_alu_reg_reg && mem_rdata_q[14:12] == 3'b000 && mem_rdata_q[31:25] == 7'b0100000; + instr_sll <= is_alu_reg_reg && mem_rdata_q[14:12] == 3'b001 && mem_rdata_q[31:25] == 7'b0000000; + instr_slt <= is_alu_reg_reg && mem_rdata_q[14:12] == 3'b010 && mem_rdata_q[31:25] == 7'b0000000; + instr_sltu <= is_alu_reg_reg && mem_rdata_q[14:12] == 3'b011 && mem_rdata_q[31:25] == 7'b0000000; + instr_xor <= is_alu_reg_reg && mem_rdata_q[14:12] == 3'b100 && mem_rdata_q[31:25] == 7'b0000000; + instr_srl <= is_alu_reg_reg && mem_rdata_q[14:12] == 3'b101 && mem_rdata_q[31:25] == 7'b0000000; + instr_sra <= is_alu_reg_reg && mem_rdata_q[14:12] == 3'b101 && mem_rdata_q[31:25] == 7'b0100000; + instr_or <= is_alu_reg_reg && mem_rdata_q[14:12] == 3'b110 && mem_rdata_q[31:25] == 7'b0000000; + instr_and <= is_alu_reg_reg && mem_rdata_q[14:12] == 3'b111 && mem_rdata_q[31:25] == 7'b0000000; + + instr_rdcycle <= ((mem_rdata_q[6:0] == 7'b1110011 && 
mem_rdata_q[31:12] == 'b11000000000000000010) || + (mem_rdata_q[6:0] == 7'b1110011 && mem_rdata_q[31:12] == 'b11000000000100000010)) && ENABLE_COUNTERS; + instr_rdcycleh <= ((mem_rdata_q[6:0] == 7'b1110011 && mem_rdata_q[31:12] == 'b11001000000000000010) || + (mem_rdata_q[6:0] == 7'b1110011 && mem_rdata_q[31:12] == 'b11001000000100000010)) && ENABLE_COUNTERS && ENABLE_COUNTERS64; + instr_rdinstr <= (mem_rdata_q[6:0] == 7'b1110011 && mem_rdata_q[31:12] == 'b11000000001000000010) && ENABLE_COUNTERS; + instr_rdinstrh <= (mem_rdata_q[6:0] == 7'b1110011 && mem_rdata_q[31:12] == 'b11001000001000000010) && ENABLE_COUNTERS && ENABLE_COUNTERS64; + + instr_ecall_ebreak <= ((mem_rdata_q[6:0] == 7'b1110011 && !mem_rdata_q[31:21] && !mem_rdata_q[19:7]) || + (COMPRESSED_ISA && mem_rdata_q[15:0] == 16'h9002)); + + instr_getq <= mem_rdata_q[6:0] == 7'b0001011 && mem_rdata_q[31:25] == 7'b0000000 && ENABLE_IRQ && ENABLE_IRQ_QREGS; + instr_setq <= mem_rdata_q[6:0] == 7'b0001011 && mem_rdata_q[31:25] == 7'b0000001 && ENABLE_IRQ && ENABLE_IRQ_QREGS; + instr_maskirq <= mem_rdata_q[6:0] == 7'b0001011 && mem_rdata_q[31:25] == 7'b0000011 && ENABLE_IRQ; + instr_timer <= mem_rdata_q[6:0] == 7'b0001011 && mem_rdata_q[31:25] == 7'b0000101 && ENABLE_IRQ && ENABLE_IRQ_TIMER; + + is_slli_srli_srai <= is_alu_reg_imm && |{ + mem_rdata_q[14:12] == 3'b001 && mem_rdata_q[31:25] == 7'b0000000, + mem_rdata_q[14:12] == 3'b101 && mem_rdata_q[31:25] == 7'b0000000, + mem_rdata_q[14:12] == 3'b101 && mem_rdata_q[31:25] == 7'b0100000 + }; + + is_jalr_addi_slti_sltiu_xori_ori_andi <= instr_jalr || is_alu_reg_imm && |{ + mem_rdata_q[14:12] == 3'b000, + mem_rdata_q[14:12] == 3'b010, + mem_rdata_q[14:12] == 3'b011, + mem_rdata_q[14:12] == 3'b100, + mem_rdata_q[14:12] == 3'b110, + mem_rdata_q[14:12] == 3'b111 + }; + + is_sll_srl_sra <= is_alu_reg_reg && |{ + mem_rdata_q[14:12] == 3'b001 && mem_rdata_q[31:25] == 7'b0000000, + mem_rdata_q[14:12] == 3'b101 && mem_rdata_q[31:25] == 7'b0000000, + mem_rdata_q[14:12] == 3'b101 && mem_rdata_q[31:25] == 7'b0100000 + }; + + is_lui_auipc_jal_jalr_addi_add_sub <= 0; + is_compare <= 0; + + (* parallel_case *) + case (1'b1) + instr_jal: + decoded_imm <= decoded_imm_uj; + |{instr_lui, instr_auipc}: + decoded_imm <= mem_rdata_q[31:12] << 12; + |{instr_jalr, is_lb_lh_lw_lbu_lhu, is_alu_reg_imm}: + decoded_imm <= $signed(mem_rdata_q[31:20]); + is_beq_bne_blt_bge_bltu_bgeu: + decoded_imm <= $signed({mem_rdata_q[31], mem_rdata_q[7], mem_rdata_q[30:25], mem_rdata_q[11:8], 1'b0}); + is_sb_sh_sw: + decoded_imm <= $signed({mem_rdata_q[31:25], mem_rdata_q[11:7]}); + default: + decoded_imm <= 1'bx; + endcase + end + + if (!resetn) begin + is_beq_bne_blt_bge_bltu_bgeu <= 0; + is_compare <= 0; + + instr_beq <= 0; + instr_bne <= 0; + instr_blt <= 0; + instr_bge <= 0; + instr_bltu <= 0; + instr_bgeu <= 0; + + instr_addi <= 0; + instr_slti <= 0; + instr_sltiu <= 0; + instr_xori <= 0; + instr_ori <= 0; + instr_andi <= 0; + + instr_add <= 0; + instr_sub <= 0; + instr_sll <= 0; + instr_slt <= 0; + instr_sltu <= 0; + instr_xor <= 0; + instr_srl <= 0; + instr_sra <= 0; + instr_or <= 0; + instr_and <= 0; + end + end + + + // Main State Machine + + localparam cpu_state_trap = 8'b10000000; + localparam cpu_state_fetch = 8'b01000000; + localparam cpu_state_ld_rs1 = 8'b00100000; + localparam cpu_state_ld_rs2 = 8'b00010000; + localparam cpu_state_exec = 8'b00001000; + localparam cpu_state_shift = 8'b00000100; + localparam cpu_state_stmem = 8'b00000010; + localparam cpu_state_ldmem = 8'b00000001; + + reg [7:0] cpu_state; + reg 
[1:0] irq_state; + + `FORMAL_KEEP reg [127:0] dbg_ascii_state; + + always @* begin + dbg_ascii_state = ""; + if (cpu_state == cpu_state_trap) dbg_ascii_state = "trap"; + if (cpu_state == cpu_state_fetch) dbg_ascii_state = "fetch"; + if (cpu_state == cpu_state_ld_rs1) dbg_ascii_state = "ld_rs1"; + if (cpu_state == cpu_state_ld_rs2) dbg_ascii_state = "ld_rs2"; + if (cpu_state == cpu_state_exec) dbg_ascii_state = "exec"; + if (cpu_state == cpu_state_shift) dbg_ascii_state = "shift"; + if (cpu_state == cpu_state_stmem) dbg_ascii_state = "stmem"; + if (cpu_state == cpu_state_ldmem) dbg_ascii_state = "ldmem"; + end + + reg set_mem_do_rinst; + reg set_mem_do_rdata; + reg set_mem_do_wdata; + + reg latched_store; + reg latched_stalu; + reg latched_branch; + reg latched_compr; + reg latched_trace; + reg latched_is_lu; + reg latched_is_lh; + reg latched_is_lb; + reg [regindex_bits-1:0] latched_rd; + + reg [31:0] current_pc; + assign next_pc = latched_store && latched_branch ? reg_out & ~1 : reg_next_pc; + + reg [3:0] pcpi_timeout_counter; + reg pcpi_timeout; + + reg [31:0] next_irq_pending; + reg do_waitirq; + + reg [31:0] alu_out, alu_out_q; + reg alu_out_0, alu_out_0_q; + reg alu_wait, alu_wait_2; + + reg [31:0] alu_add_sub; + reg [31:0] alu_shl, alu_shr; + reg alu_eq, alu_ltu, alu_lts; + + generate if (TWO_CYCLE_ALU) begin + always @(posedge clk) begin + alu_add_sub <= instr_sub ? reg_op1 - reg_op2 : reg_op1 + reg_op2; + alu_eq <= reg_op1 == reg_op2; + alu_lts <= $signed(reg_op1) < $signed(reg_op2); + alu_ltu <= reg_op1 < reg_op2; + alu_shl <= reg_op1 << reg_op2[4:0]; + alu_shr <= $signed({instr_sra || instr_srai ? reg_op1[31] : 1'b0, reg_op1}) >>> reg_op2[4:0]; + end + end else begin + always @* begin + alu_add_sub = instr_sub ? reg_op1 - reg_op2 : reg_op1 + reg_op2; + alu_eq = reg_op1 == reg_op2; + alu_lts = $signed(reg_op1) < $signed(reg_op2); + alu_ltu = reg_op1 < reg_op2; + alu_shl = reg_op1 << reg_op2[4:0]; + alu_shr = $signed({instr_sra || instr_srai ? 
reg_op1[31] : 1'b0, reg_op1}) >>> reg_op2[4:0]; + end + end endgenerate + + always @* begin + alu_out_0 = 'bx; + (* parallel_case, full_case *) + case (1'b1) + instr_beq: + alu_out_0 = alu_eq; + instr_bne: + alu_out_0 = !alu_eq; + instr_bge: + alu_out_0 = !alu_lts; + instr_bgeu: + alu_out_0 = !alu_ltu; + is_slti_blt_slt && (!TWO_CYCLE_COMPARE || !{instr_beq,instr_bne,instr_bge,instr_bgeu}): + alu_out_0 = alu_lts; + is_sltiu_bltu_sltu && (!TWO_CYCLE_COMPARE || !{instr_beq,instr_bne,instr_bge,instr_bgeu}): + alu_out_0 = alu_ltu; + endcase + + alu_out = 'bx; + (* parallel_case, full_case *) + case (1'b1) + is_lui_auipc_jal_jalr_addi_add_sub: + alu_out = alu_add_sub; + is_compare: + alu_out = alu_out_0; + instr_xori || instr_xor: + alu_out = reg_op1 ^ reg_op2; + instr_ori || instr_or: + alu_out = reg_op1 | reg_op2; + instr_andi || instr_and: + alu_out = reg_op1 & reg_op2; + BARREL_SHIFTER && (instr_sll || instr_slli): + alu_out = alu_shl; + BARREL_SHIFTER && (instr_srl || instr_srli || instr_sra || instr_srai): + alu_out = alu_shr; + endcase + +`ifdef RISCV_FORMAL_BLACKBOX_ALU + alu_out_0 = $anyseq; + alu_out = $anyseq; +`endif + end + + reg clear_prefetched_high_word_q; + always @(posedge clk) clear_prefetched_high_word_q <= clear_prefetched_high_word; + + always @* begin + clear_prefetched_high_word = clear_prefetched_high_word_q; + if (!prefetched_high_word) + clear_prefetched_high_word = 0; + if (latched_branch || irq_state || !resetn) + clear_prefetched_high_word = COMPRESSED_ISA; + end + + reg cpuregs_write; + reg [31:0] cpuregs_wrdata; + reg [31:0] cpuregs_rs1; + reg [31:0] cpuregs_rs2; + reg [regindex_bits-1:0] decoded_rs; + + always @* begin + cpuregs_write = 0; + cpuregs_wrdata = 'bx; + + if (cpu_state == cpu_state_fetch) begin + (* parallel_case *) + case (1'b1) + latched_branch: begin + cpuregs_wrdata = reg_pc + (latched_compr ? 2 : 4); + cpuregs_write = 1; + end + latched_store && !latched_branch: begin + cpuregs_wrdata = latched_stalu ? alu_out_q : reg_out; + cpuregs_write = 1; + end + ENABLE_IRQ && irq_state[0]: begin + cpuregs_wrdata = reg_next_pc | latched_compr; + cpuregs_write = 1; + end + ENABLE_IRQ && irq_state[1]: begin + cpuregs_wrdata = irq_pending & ~irq_mask; + cpuregs_write = 1; + end + endcase + end + end + +`ifndef PICORV32_REGS + always @(posedge clk) begin + if (resetn && cpuregs_write && latched_rd) + cpuregs[latched_rd] <= cpuregs_wrdata; + end + + always @* begin + decoded_rs = 'bx; + if (ENABLE_REGS_DUALPORT) begin +`ifndef RISCV_FORMAL_BLACKBOX_REGS + cpuregs_rs1 = decoded_rs1 ? cpuregs[decoded_rs1] : 0; + cpuregs_rs2 = decoded_rs2 ? cpuregs[decoded_rs2] : 0; +`else + cpuregs_rs1 = decoded_rs1 ? $anyseq : 0; + cpuregs_rs2 = decoded_rs2 ? $anyseq : 0; +`endif + end else begin + decoded_rs = (cpu_state == cpu_state_ld_rs2) ? decoded_rs2 : decoded_rs1; +`ifndef RISCV_FORMAL_BLACKBOX_REGS + cpuregs_rs1 = decoded_rs ? cpuregs[decoded_rs] : 0; +`else + cpuregs_rs1 = decoded_rs ? $anyseq : 0; +`endif + cpuregs_rs2 = cpuregs_rs1; + end + end +`else + wire[31:0] cpuregs_rdata1; + wire[31:0] cpuregs_rdata2; + + wire [5:0] cpuregs_waddr = latched_rd; + wire [5:0] cpuregs_raddr1 = ENABLE_REGS_DUALPORT ? decoded_rs1 : decoded_rs; + wire [5:0] cpuregs_raddr2 = ENABLE_REGS_DUALPORT ? 
decoded_rs2 : 0; + + `PICORV32_REGS cpuregs ( + .clk(clk), + .wen(resetn && cpuregs_write && latched_rd), + .waddr(cpuregs_waddr), + .raddr1(cpuregs_raddr1), + .raddr2(cpuregs_raddr2), + .wdata(cpuregs_wrdata), + .rdata1(cpuregs_rdata1), + .rdata2(cpuregs_rdata2) + ); + + always @* begin + decoded_rs = 'bx; + if (ENABLE_REGS_DUALPORT) begin + cpuregs_rs1 = decoded_rs1 ? cpuregs_rdata1 : 0; + cpuregs_rs2 = decoded_rs2 ? cpuregs_rdata2 : 0; + end else begin + decoded_rs = (cpu_state == cpu_state_ld_rs2) ? decoded_rs2 : decoded_rs1; + cpuregs_rs1 = decoded_rs ? cpuregs_rdata1 : 0; + cpuregs_rs2 = cpuregs_rs1; + end + end +`endif + + assign launch_next_insn = cpu_state == cpu_state_fetch && decoder_trigger && (!ENABLE_IRQ || irq_delay || irq_active || !(irq_pending & ~irq_mask)); + + always @(posedge clk) begin + trap <= 0; + reg_sh <= 'bx; + reg_out <= 'bx; + set_mem_do_rinst = 0; + set_mem_do_rdata = 0; + set_mem_do_wdata = 0; + + alu_out_0_q <= alu_out_0; + alu_out_q <= alu_out; + + alu_wait <= 0; + alu_wait_2 <= 0; + + if (launch_next_insn) begin + dbg_rs1val <= 'bx; + dbg_rs2val <= 'bx; + dbg_rs1val_valid <= 0; + dbg_rs2val_valid <= 0; + end + + if (WITH_PCPI && CATCH_ILLINSN) begin + if (resetn && pcpi_valid && !pcpi_int_wait) begin + if (pcpi_timeout_counter) + pcpi_timeout_counter <= pcpi_timeout_counter - 1; + end else + pcpi_timeout_counter <= ~0; + pcpi_timeout <= !pcpi_timeout_counter; + end + + if (ENABLE_COUNTERS) begin + count_cycle <= resetn ? count_cycle + 1 : 0; + if (!ENABLE_COUNTERS64) count_cycle[63:32] <= 0; + end else begin + count_cycle <= 'bx; + count_instr <= 'bx; + end + + next_irq_pending = ENABLE_IRQ ? irq_pending & LATCHED_IRQ : 'bx; + + if (ENABLE_IRQ && ENABLE_IRQ_TIMER && timer) begin + if (timer - 1 == 0) + next_irq_pending[irq_timer] = 1; + timer <= timer - 1; + end + + if (ENABLE_IRQ) begin + next_irq_pending = next_irq_pending | irq; + end + + decoder_trigger <= mem_do_rinst && mem_done; + decoder_trigger_q <= decoder_trigger; + decoder_pseudo_trigger <= 0; + decoder_pseudo_trigger_q <= decoder_pseudo_trigger; + do_waitirq <= 0; + + trace_valid <= 0; + + if (!ENABLE_TRACE) + trace_data <= 'bx; + + if (!resetn) begin + reg_pc <= PROGADDR_RESET; + reg_next_pc <= PROGADDR_RESET; + if (ENABLE_COUNTERS) + count_instr <= 0; + latched_store <= 0; + latched_stalu <= 0; + latched_branch <= 0; + latched_trace <= 0; + latched_is_lu <= 0; + latched_is_lh <= 0; + latched_is_lb <= 0; + pcpi_valid <= 0; + pcpi_timeout <= 0; + irq_active <= 0; + irq_delay <= 0; + irq_mask <= ~0; + next_irq_pending = 0; + irq_state <= 0; + eoi <= 0; + timer <= 0; + if (~STACKADDR) begin + latched_store <= 1; + latched_rd <= 2; + reg_out <= STACKADDR; + end + cpu_state <= cpu_state_fetch; + end else + (* parallel_case, full_case *) + case (cpu_state) + cpu_state_trap: begin + trap <= 1; + end + + cpu_state_fetch: begin + mem_do_rinst <= !decoder_trigger && !do_waitirq; + mem_wordsize <= 0; + + current_pc = reg_next_pc; + + (* parallel_case *) + case (1'b1) + latched_branch: begin + current_pc = latched_store ? (latched_stalu ? alu_out_q : reg_out) & ~1 : reg_next_pc; + `debug($display("ST_RD: %2d 0x%08x, BRANCH 0x%08x", latched_rd, reg_pc + (latched_compr ? 2 : 4), current_pc);) + end + latched_store && !latched_branch: begin + `debug($display("ST_RD: %2d 0x%08x", latched_rd, latched_stalu ? 
alu_out_q : reg_out);) + end + ENABLE_IRQ && irq_state[0]: begin + current_pc = PROGADDR_IRQ; + irq_active <= 1; + mem_do_rinst <= 1; + end + ENABLE_IRQ && irq_state[1]: begin + eoi <= irq_pending & ~irq_mask; + next_irq_pending = next_irq_pending & irq_mask; + end + endcase + + if (ENABLE_TRACE && latched_trace) begin + latched_trace <= 0; + trace_valid <= 1; + if (latched_branch) + trace_data <= (irq_active ? TRACE_IRQ : 0) | TRACE_BRANCH | (current_pc & 32'hfffffffe); + else + trace_data <= (irq_active ? TRACE_IRQ : 0) | (latched_stalu ? alu_out_q : reg_out); + end + + reg_pc <= current_pc; + reg_next_pc <= current_pc; + + latched_store <= 0; + latched_stalu <= 0; + latched_branch <= 0; + latched_is_lu <= 0; + latched_is_lh <= 0; + latched_is_lb <= 0; + latched_rd <= decoded_rd; + latched_compr <= compressed_instr; + + if (ENABLE_IRQ && ((decoder_trigger && !irq_active && !irq_delay && |(irq_pending & ~irq_mask)) || irq_state)) begin + irq_state <= + irq_state == 2'b00 ? 2'b01 : + irq_state == 2'b01 ? 2'b10 : 2'b00; + latched_compr <= latched_compr; + if (ENABLE_IRQ_QREGS) + latched_rd <= irqregs_offset | irq_state[0]; + else + latched_rd <= irq_state[0] ? 4 : 3; + end else + if (ENABLE_IRQ && (decoder_trigger || do_waitirq) && instr_waitirq) begin + if (irq_pending) begin + latched_store <= 1; + reg_out <= irq_pending; + reg_next_pc <= current_pc + (compressed_instr ? 2 : 4); + mem_do_rinst <= 1; + end else + do_waitirq <= 1; + end else + if (decoder_trigger) begin + `debug($display("-- %-0t", $time);) + irq_delay <= irq_active; + reg_next_pc <= current_pc + (compressed_instr ? 2 : 4); + if (ENABLE_TRACE) + latched_trace <= 1; + if (ENABLE_COUNTERS) begin + count_instr <= count_instr + 1; + if (!ENABLE_COUNTERS64) count_instr[63:32] <= 0; + end + if (instr_jal) begin + mem_do_rinst <= 1; + reg_next_pc <= current_pc + decoded_imm_uj; + latched_branch <= 1; + end else begin + mem_do_rinst <= 0; + mem_do_prefetch <= !instr_jalr && !instr_retirq; + cpu_state <= cpu_state_ld_rs1; + end + end + end + + cpu_state_ld_rs1: begin + reg_op1 <= 'bx; + reg_op2 <= 'bx; + + (* parallel_case *) + case (1'b1) + (CATCH_ILLINSN || WITH_PCPI) && instr_trap: begin + if (WITH_PCPI) begin + `debug($display("LD_RS1: %2d 0x%08x", decoded_rs1, cpuregs_rs1);) + reg_op1 <= cpuregs_rs1; + dbg_rs1val <= cpuregs_rs1; + dbg_rs1val_valid <= 1; + if (ENABLE_REGS_DUALPORT) begin + pcpi_valid <= 1; + `debug($display("LD_RS2: %2d 0x%08x", decoded_rs2, cpuregs_rs2);) + reg_sh <= cpuregs_rs2; + reg_op2 <= cpuregs_rs2; + dbg_rs2val <= cpuregs_rs2; + dbg_rs2val_valid <= 1; + if (pcpi_int_ready) begin + mem_do_rinst <= 1; + pcpi_valid <= 0; + reg_out <= pcpi_int_rd; + latched_store <= pcpi_int_wr; + cpu_state <= cpu_state_fetch; + end else + if (CATCH_ILLINSN && (pcpi_timeout || instr_ecall_ebreak)) begin + pcpi_valid <= 0; + `debug($display("EBREAK OR UNSUPPORTED INSN AT 0x%08x", reg_pc);) + if (ENABLE_IRQ && !irq_mask[irq_ebreak] && !irq_active) begin + next_irq_pending[irq_ebreak] = 1; + cpu_state <= cpu_state_fetch; + end else + cpu_state <= cpu_state_trap; + end + end else begin + cpu_state <= cpu_state_ld_rs2; + end + end else begin + `debug($display("EBREAK OR UNSUPPORTED INSN AT 0x%08x", reg_pc);) + if (ENABLE_IRQ && !irq_mask[irq_ebreak] && !irq_active) begin + next_irq_pending[irq_ebreak] = 1; + cpu_state <= cpu_state_fetch; + end else + cpu_state <= cpu_state_trap; + end + end + ENABLE_COUNTERS && is_rdcycle_rdcycleh_rdinstr_rdinstrh: begin + (* parallel_case, full_case *) + case (1'b1) + instr_rdcycle: + reg_out <= 
count_cycle[31:0]; + instr_rdcycleh && ENABLE_COUNTERS64: + reg_out <= count_cycle[63:32]; + instr_rdinstr: + reg_out <= count_instr[31:0]; + instr_rdinstrh && ENABLE_COUNTERS64: + reg_out <= count_instr[63:32]; + endcase + latched_store <= 1; + cpu_state <= cpu_state_fetch; + end + is_lui_auipc_jal: begin + reg_op1 <= instr_lui ? 0 : reg_pc; + reg_op2 <= decoded_imm; + if (TWO_CYCLE_ALU) + alu_wait <= 1; + else + mem_do_rinst <= mem_do_prefetch; + cpu_state <= cpu_state_exec; + end + ENABLE_IRQ && ENABLE_IRQ_QREGS && instr_getq: begin + `debug($display("LD_RS1: %2d 0x%08x", decoded_rs1, cpuregs_rs1);) + reg_out <= cpuregs_rs1; + dbg_rs1val <= cpuregs_rs1; + dbg_rs1val_valid <= 1; + latched_store <= 1; + cpu_state <= cpu_state_fetch; + end + ENABLE_IRQ && ENABLE_IRQ_QREGS && instr_setq: begin + `debug($display("LD_RS1: %2d 0x%08x", decoded_rs1, cpuregs_rs1);) + reg_out <= cpuregs_rs1; + dbg_rs1val <= cpuregs_rs1; + dbg_rs1val_valid <= 1; + latched_rd <= latched_rd | irqregs_offset; + latched_store <= 1; + cpu_state <= cpu_state_fetch; + end + ENABLE_IRQ && instr_retirq: begin + eoi <= 0; + irq_active <= 0; + latched_branch <= 1; + latched_store <= 1; + `debug($display("LD_RS1: %2d 0x%08x", decoded_rs1, cpuregs_rs1);) + reg_out <= CATCH_MISALIGN ? (cpuregs_rs1 & 32'h fffffffe) : cpuregs_rs1; + dbg_rs1val <= cpuregs_rs1; + dbg_rs1val_valid <= 1; + cpu_state <= cpu_state_fetch; + end + ENABLE_IRQ && instr_maskirq: begin + latched_store <= 1; + reg_out <= irq_mask; + `debug($display("LD_RS1: %2d 0x%08x", decoded_rs1, cpuregs_rs1);) + irq_mask <= cpuregs_rs1 | MASKED_IRQ; + dbg_rs1val <= cpuregs_rs1; + dbg_rs1val_valid <= 1; + cpu_state <= cpu_state_fetch; + end + ENABLE_IRQ && ENABLE_IRQ_TIMER && instr_timer: begin + latched_store <= 1; + reg_out <= timer; + `debug($display("LD_RS1: %2d 0x%08x", decoded_rs1, cpuregs_rs1);) + timer <= cpuregs_rs1; + dbg_rs1val <= cpuregs_rs1; + dbg_rs1val_valid <= 1; + cpu_state <= cpu_state_fetch; + end + is_lb_lh_lw_lbu_lhu && !instr_trap: begin + `debug($display("LD_RS1: %2d 0x%08x", decoded_rs1, cpuregs_rs1);) + reg_op1 <= cpuregs_rs1; + dbg_rs1val <= cpuregs_rs1; + dbg_rs1val_valid <= 1; + cpu_state <= cpu_state_ldmem; + mem_do_rinst <= 1; + end + is_slli_srli_srai && !BARREL_SHIFTER: begin + `debug($display("LD_RS1: %2d 0x%08x", decoded_rs1, cpuregs_rs1);) + reg_op1 <= cpuregs_rs1; + dbg_rs1val <= cpuregs_rs1; + dbg_rs1val_valid <= 1; + reg_sh <= decoded_rs2; + cpu_state <= cpu_state_shift; + end + is_jalr_addi_slti_sltiu_xori_ori_andi, is_slli_srli_srai && BARREL_SHIFTER: begin + `debug($display("LD_RS1: %2d 0x%08x", decoded_rs1, cpuregs_rs1);) + reg_op1 <= cpuregs_rs1; + dbg_rs1val <= cpuregs_rs1; + dbg_rs1val_valid <= 1; + reg_op2 <= is_slli_srli_srai && BARREL_SHIFTER ? 
decoded_rs2 : decoded_imm; + if (TWO_CYCLE_ALU) + alu_wait <= 1; + else + mem_do_rinst <= mem_do_prefetch; + cpu_state <= cpu_state_exec; + end + default: begin + `debug($display("LD_RS1: %2d 0x%08x", decoded_rs1, cpuregs_rs1);) + reg_op1 <= cpuregs_rs1; + dbg_rs1val <= cpuregs_rs1; + dbg_rs1val_valid <= 1; + if (ENABLE_REGS_DUALPORT) begin + `debug($display("LD_RS2: %2d 0x%08x", decoded_rs2, cpuregs_rs2);) + reg_sh <= cpuregs_rs2; + reg_op2 <= cpuregs_rs2; + dbg_rs2val <= cpuregs_rs2; + dbg_rs2val_valid <= 1; + (* parallel_case *) + case (1'b1) + is_sb_sh_sw: begin + cpu_state <= cpu_state_stmem; + mem_do_rinst <= 1; + end + is_sll_srl_sra && !BARREL_SHIFTER: begin + cpu_state <= cpu_state_shift; + end + default: begin + if (TWO_CYCLE_ALU || (TWO_CYCLE_COMPARE && is_beq_bne_blt_bge_bltu_bgeu)) begin + alu_wait_2 <= TWO_CYCLE_ALU && (TWO_CYCLE_COMPARE && is_beq_bne_blt_bge_bltu_bgeu); + alu_wait <= 1; + end else + mem_do_rinst <= mem_do_prefetch; + cpu_state <= cpu_state_exec; + end + endcase + end else + cpu_state <= cpu_state_ld_rs2; + end + endcase + end + + cpu_state_ld_rs2: begin + `debug($display("LD_RS2: %2d 0x%08x", decoded_rs2, cpuregs_rs2);) + reg_sh <= cpuregs_rs2; + reg_op2 <= cpuregs_rs2; + dbg_rs2val <= cpuregs_rs2; + dbg_rs2val_valid <= 1; + + (* parallel_case *) + case (1'b1) + WITH_PCPI && instr_trap: begin + pcpi_valid <= 1; + if (pcpi_int_ready) begin + mem_do_rinst <= 1; + pcpi_valid <= 0; + reg_out <= pcpi_int_rd; + latched_store <= pcpi_int_wr; + cpu_state <= cpu_state_fetch; + end else + if (CATCH_ILLINSN && (pcpi_timeout || instr_ecall_ebreak)) begin + pcpi_valid <= 0; + `debug($display("EBREAK OR UNSUPPORTED INSN AT 0x%08x", reg_pc);) + if (ENABLE_IRQ && !irq_mask[irq_ebreak] && !irq_active) begin + next_irq_pending[irq_ebreak] = 1; + cpu_state <= cpu_state_fetch; + end else + cpu_state <= cpu_state_trap; + end + end + is_sb_sh_sw: begin + cpu_state <= cpu_state_stmem; + mem_do_rinst <= 1; + end + is_sll_srl_sra && !BARREL_SHIFTER: begin + cpu_state <= cpu_state_shift; + end + default: begin + if (TWO_CYCLE_ALU || (TWO_CYCLE_COMPARE && is_beq_bne_blt_bge_bltu_bgeu)) begin + alu_wait_2 <= TWO_CYCLE_ALU && (TWO_CYCLE_COMPARE && is_beq_bne_blt_bge_bltu_bgeu); + alu_wait <= 1; + end else + mem_do_rinst <= mem_do_prefetch; + cpu_state <= cpu_state_exec; + end + endcase + end + + cpu_state_exec: begin + reg_out <= reg_pc + decoded_imm; + if ((TWO_CYCLE_ALU || TWO_CYCLE_COMPARE) && (alu_wait || alu_wait_2)) begin + mem_do_rinst <= mem_do_prefetch && !alu_wait_2; + alu_wait <= alu_wait_2; + end else + if (is_beq_bne_blt_bge_bltu_bgeu) begin + latched_rd <= 0; + latched_store <= TWO_CYCLE_COMPARE ? alu_out_0_q : alu_out_0; + latched_branch <= TWO_CYCLE_COMPARE ? alu_out_0_q : alu_out_0; + if (mem_done) + cpu_state <= cpu_state_fetch; + if (TWO_CYCLE_COMPARE ? 
alu_out_0_q : alu_out_0) begin + decoder_trigger <= 0; + set_mem_do_rinst = 1; + end + end else begin + latched_branch <= instr_jalr; + latched_store <= 1; + latched_stalu <= 1; + cpu_state <= cpu_state_fetch; + end + end + + cpu_state_shift: begin + latched_store <= 1; + if (reg_sh == 0) begin + reg_out <= reg_op1; + mem_do_rinst <= mem_do_prefetch; + cpu_state <= cpu_state_fetch; + end else if (TWO_STAGE_SHIFT && reg_sh >= 4) begin + (* parallel_case, full_case *) + case (1'b1) + instr_slli || instr_sll: reg_op1 <= reg_op1 << 4; + instr_srli || instr_srl: reg_op1 <= reg_op1 >> 4; + instr_srai || instr_sra: reg_op1 <= $signed(reg_op1) >>> 4; + endcase + reg_sh <= reg_sh - 4; + end else begin + (* parallel_case, full_case *) + case (1'b1) + instr_slli || instr_sll: reg_op1 <= reg_op1 << 1; + instr_srli || instr_srl: reg_op1 <= reg_op1 >> 1; + instr_srai || instr_sra: reg_op1 <= $signed(reg_op1) >>> 1; + endcase + reg_sh <= reg_sh - 1; + end + end + + cpu_state_stmem: begin + if (ENABLE_TRACE) + reg_out <= reg_op2; + if (!mem_do_prefetch || mem_done) begin + if (!mem_do_wdata) begin + (* parallel_case, full_case *) + case (1'b1) + instr_sb: mem_wordsize <= 2; + instr_sh: mem_wordsize <= 1; + instr_sw: mem_wordsize <= 0; + endcase + if (ENABLE_TRACE) begin + trace_valid <= 1; + trace_data <= (irq_active ? TRACE_IRQ : 0) | TRACE_ADDR | ((reg_op1 + decoded_imm) & 32'hffffffff); + end + reg_op1 <= reg_op1 + decoded_imm; + set_mem_do_wdata = 1; + end + if (!mem_do_prefetch && mem_done) begin + cpu_state <= cpu_state_fetch; + decoder_trigger <= 1; + decoder_pseudo_trigger <= 1; + end + end + end + + cpu_state_ldmem: begin + latched_store <= 1; + if (!mem_do_prefetch || mem_done) begin + if (!mem_do_rdata) begin + (* parallel_case, full_case *) + case (1'b1) + instr_lb || instr_lbu: mem_wordsize <= 2; + instr_lh || instr_lhu: mem_wordsize <= 1; + instr_lw: mem_wordsize <= 0; + endcase + latched_is_lu <= is_lbu_lhu_lw; + latched_is_lh <= instr_lh; + latched_is_lb <= instr_lb; + if (ENABLE_TRACE) begin + trace_valid <= 1; + trace_data <= (irq_active ? TRACE_IRQ : 0) | TRACE_ADDR | ((reg_op1 + decoded_imm) & 32'hffffffff); + end + reg_op1 <= reg_op1 + decoded_imm; + set_mem_do_rdata = 1; + end + if (!mem_do_prefetch && mem_done) begin + (* parallel_case, full_case *) + case (1'b1) + latched_is_lu: reg_out <= mem_rdata_word; + latched_is_lh: reg_out <= $signed(mem_rdata_word[15:0]); + latched_is_lb: reg_out <= $signed(mem_rdata_word[7:0]); + endcase + decoder_trigger <= 1; + decoder_pseudo_trigger <= 1; + cpu_state <= cpu_state_fetch; + end + end + end + endcase + + if (CATCH_MISALIGN && resetn && (mem_do_rdata || mem_do_wdata)) begin + if (mem_wordsize == 0 && reg_op1[1:0] != 0) begin + `debug($display("MISALIGNED WORD: 0x%08x", reg_op1);) + if (ENABLE_IRQ && !irq_mask[irq_buserror] && !irq_active) begin + next_irq_pending[irq_buserror] = 1; + end else + cpu_state <= cpu_state_trap; + end + if (mem_wordsize == 1 && reg_op1[0] != 0) begin + `debug($display("MISALIGNED HALFWORD: 0x%08x", reg_op1);) + if (ENABLE_IRQ && !irq_mask[irq_buserror] && !irq_active) begin + next_irq_pending[irq_buserror] = 1; + end else + cpu_state <= cpu_state_trap; + end + end + if (CATCH_MISALIGN && resetn && mem_do_rinst && (COMPRESSED_ISA ? 
reg_pc[0] : |reg_pc[1:0])) begin + `debug($display("MISALIGNED INSTRUCTION: 0x%08x", reg_pc);) + if (ENABLE_IRQ && !irq_mask[irq_buserror] && !irq_active) begin + next_irq_pending[irq_buserror] = 1; + end else + cpu_state <= cpu_state_trap; + end + if (!CATCH_ILLINSN && decoder_trigger_q && !decoder_pseudo_trigger_q && instr_ecall_ebreak) begin + cpu_state <= cpu_state_trap; + end + + if (!resetn || mem_done) begin + mem_do_prefetch <= 0; + mem_do_rinst <= 0; + mem_do_rdata <= 0; + mem_do_wdata <= 0; + end + + if (set_mem_do_rinst) + mem_do_rinst <= 1; + if (set_mem_do_rdata) + mem_do_rdata <= 1; + if (set_mem_do_wdata) + mem_do_wdata <= 1; + + irq_pending <= next_irq_pending & ~MASKED_IRQ; + + if (!CATCH_MISALIGN) begin + if (COMPRESSED_ISA) begin + reg_pc[0] <= 0; + reg_next_pc[0] <= 0; + end else begin + reg_pc[1:0] <= 0; + reg_next_pc[1:0] <= 0; + end + end + current_pc = 'bx; + end + +`ifdef RISCV_FORMAL + reg dbg_irq_call; + reg dbg_irq_enter; + reg [31:0] dbg_irq_ret; + always @(posedge clk) begin + rvfi_valid <= resetn && (launch_next_insn || trap) && dbg_valid_insn; + rvfi_order <= resetn ? rvfi_order + rvfi_valid : 0; + + rvfi_insn <= dbg_insn_opcode; + rvfi_rs1_addr <= dbg_rs1val_valid ? dbg_insn_rs1 : 0; + rvfi_rs2_addr <= dbg_rs2val_valid ? dbg_insn_rs2 : 0; + rvfi_pc_rdata <= dbg_insn_addr; + rvfi_rs1_rdata <= dbg_rs1val_valid ? dbg_rs1val : 0; + rvfi_rs2_rdata <= dbg_rs2val_valid ? dbg_rs2val : 0; + rvfi_trap <= trap; + rvfi_halt <= trap; + rvfi_intr <= dbg_irq_enter; + + if (!resetn) begin + dbg_irq_call <= 0; + dbg_irq_enter <= 0; + end else + if (rvfi_valid) begin + dbg_irq_call <= 0; + dbg_irq_enter <= dbg_irq_call; + end else + if (irq_state == 1) begin + dbg_irq_call <= 1; + dbg_irq_ret <= next_pc; + end + + if (!resetn) begin + rvfi_rd_addr <= 0; + rvfi_rd_wdata <= 0; + end else + if (cpuregs_write && !irq_state) begin + rvfi_rd_addr <= latched_rd; + rvfi_rd_wdata <= latched_rd ? cpuregs_wrdata : 0; + end else + if (rvfi_valid) begin + rvfi_rd_addr <= 0; + rvfi_rd_wdata <= 0; + end + + casez (dbg_insn_opcode) + 32'b 0000000_?????_000??_???_?????_0001011: begin // getq + rvfi_rs1_addr <= 0; + rvfi_rs1_rdata <= 0; + end + 32'b 0000001_?????_?????_???_000??_0001011: begin // setq + rvfi_rd_addr <= 0; + rvfi_rd_wdata <= 0; + end + 32'b 0000010_?????_00000_???_00000_0001011: begin // retirq + rvfi_rs1_addr <= 0; + rvfi_rs1_rdata <= 0; + end + endcase + + if (!dbg_irq_call) begin + if (dbg_mem_instr) begin + rvfi_mem_addr <= 0; + rvfi_mem_rmask <= 0; + rvfi_mem_wmask <= 0; + rvfi_mem_rdata <= 0; + rvfi_mem_wdata <= 0; + end else + if (dbg_mem_valid && dbg_mem_ready) begin + rvfi_mem_addr <= dbg_mem_addr; + rvfi_mem_rmask <= dbg_mem_wstrb ? 0 : ~0; + rvfi_mem_wmask <= dbg_mem_wstrb; + rvfi_mem_rdata <= dbg_mem_rdata; + rvfi_mem_wdata <= dbg_mem_wdata; + end + end + end + + always @* begin + rvfi_pc_wdata = dbg_irq_call ? dbg_irq_ret : dbg_insn_addr; + end +`endif + + // Formal Verification +`ifdef FORMAL + reg [3:0] last_mem_nowait; + always @(posedge clk) + last_mem_nowait <= {last_mem_nowait, mem_ready || !mem_valid}; + + // stall the memory interface for max 4 cycles + restrict property (|last_mem_nowait || mem_ready || !mem_valid); + + // resetn low in first cycle, after that resetn high + restrict property (resetn != $initstate); + + // this just makes it much easier to read traces. uncomment as needed. 
+ // assume property (mem_valid || !mem_ready); + + reg ok; + always @* begin + if (resetn) begin + // instruction fetches are read-only + if (mem_valid && mem_instr) + assert (mem_wstrb == 0); + + // cpu_state must be valid + ok = 0; + if (cpu_state == cpu_state_trap) ok = 1; + if (cpu_state == cpu_state_fetch) ok = 1; + if (cpu_state == cpu_state_ld_rs1) ok = 1; + if (cpu_state == cpu_state_ld_rs2) ok = !ENABLE_REGS_DUALPORT; + if (cpu_state == cpu_state_exec) ok = 1; + if (cpu_state == cpu_state_shift) ok = 1; + if (cpu_state == cpu_state_stmem) ok = 1; + if (cpu_state == cpu_state_ldmem) ok = 1; + assert (ok); + end + end + + reg last_mem_la_read = 0; + reg last_mem_la_write = 0; + reg [31:0] last_mem_la_addr; + reg [31:0] last_mem_la_wdata; + reg [3:0] last_mem_la_wstrb = 0; + + always @(posedge clk) begin + last_mem_la_read <= mem_la_read; + last_mem_la_write <= mem_la_write; + last_mem_la_addr <= mem_la_addr; + last_mem_la_wdata <= mem_la_wdata; + last_mem_la_wstrb <= mem_la_wstrb; + + if (last_mem_la_read) begin + assert(mem_valid); + assert(mem_addr == last_mem_la_addr); + assert(mem_wstrb == 0); + end + if (last_mem_la_write) begin + assert(mem_valid); + assert(mem_addr == last_mem_la_addr); + assert(mem_wdata == last_mem_la_wdata); + assert(mem_wstrb == last_mem_la_wstrb); + end + if (mem_la_read || mem_la_write) begin + assert(!mem_valid || mem_ready); + end + end +`endif +endmodule + +// This is a simple example implementation of PICORV32_REGS. +// Use the PICORV32_REGS mechanism if you want to use custom +// memory resources to implement the processor register file. +// Note that your implementation must match the requirements of +// the PicoRV32 configuration. (e.g. QREGS, etc) +module picorv32_regs ( + input clk, wen, + input [5:0] waddr, + input [5:0] raddr1, + input [5:0] raddr2, + input [31:0] wdata, + output [31:0] rdata1, + output [31:0] rdata2 +); + reg [31:0] regs [0:30]; + + always @(posedge clk) + if (wen) regs[~waddr[4:0]] <= wdata; + + assign rdata1 = regs[~raddr1[4:0]]; + assign rdata2 = regs[~raddr2[4:0]]; +endmodule + + +/*************************************************************** + * picorv32_pcpi_mul + ***************************************************************/ + +module picorv32_pcpi_mul #( + parameter STEPS_AT_ONCE = 1, + parameter CARRY_CHAIN = 4 +) ( + input clk, resetn, + + input pcpi_valid, + input [31:0] pcpi_insn, + input [31:0] pcpi_rs1, + input [31:0] pcpi_rs2, + output reg pcpi_wr, + output reg [31:0] pcpi_rd, + output reg pcpi_wait, + output reg pcpi_ready +); + reg instr_mul, instr_mulh, instr_mulhsu, instr_mulhu; + wire instr_any_mul = |{instr_mul, instr_mulh, instr_mulhsu, instr_mulhu}; + wire instr_any_mulh = |{instr_mulh, instr_mulhsu, instr_mulhu}; + wire instr_rs1_signed = |{instr_mulh, instr_mulhsu}; + wire instr_rs2_signed = |{instr_mulh}; + + reg pcpi_wait_q; + wire mul_start = pcpi_wait && !pcpi_wait_q; + + always @(posedge clk) begin + instr_mul <= 0; + instr_mulh <= 0; + instr_mulhsu <= 0; + instr_mulhu <= 0; + + if (resetn && pcpi_valid && pcpi_insn[6:0] == 7'b0110011 && pcpi_insn[31:25] == 7'b0000001) begin + case (pcpi_insn[14:12]) + 3'b000: instr_mul <= 1; + 3'b001: instr_mulh <= 1; + 3'b010: instr_mulhsu <= 1; + 3'b011: instr_mulhu <= 1; + endcase + end + + pcpi_wait <= instr_any_mul; + pcpi_wait_q <= pcpi_wait; + end + + reg [63:0] rs1, rs2, rd, rdx; + reg [63:0] next_rs1, next_rs2, this_rs2; + reg [63:0] next_rd, next_rdx, next_rdt; + reg [6:0] mul_counter; + reg mul_waiting; + reg mul_finish; + integer i, j; + + // 
carry save accumulator + always @* begin + next_rd = rd; + next_rdx = rdx; + next_rs1 = rs1; + next_rs2 = rs2; + + for (i = 0; i < STEPS_AT_ONCE; i=i+1) begin + this_rs2 = next_rs1[0] ? next_rs2 : 0; + if (CARRY_CHAIN == 0) begin + next_rdt = next_rd ^ next_rdx ^ this_rs2; + next_rdx = ((next_rd & next_rdx) | (next_rd & this_rs2) | (next_rdx & this_rs2)) << 1; + next_rd = next_rdt; + end else begin + next_rdt = 0; + for (j = 0; j < 64; j = j + CARRY_CHAIN) + {next_rdt[j+CARRY_CHAIN-1], next_rd[j +: CARRY_CHAIN]} = + next_rd[j +: CARRY_CHAIN] + next_rdx[j +: CARRY_CHAIN] + this_rs2[j +: CARRY_CHAIN]; + next_rdx = next_rdt << 1; + end + next_rs1 = next_rs1 >> 1; + next_rs2 = next_rs2 << 1; + end + end + + always @(posedge clk) begin + mul_finish <= 0; + if (!resetn) begin + mul_waiting <= 1; + end else + if (mul_waiting) begin + if (instr_rs1_signed) + rs1 <= $signed(pcpi_rs1); + else + rs1 <= $unsigned(pcpi_rs1); + + if (instr_rs2_signed) + rs2 <= $signed(pcpi_rs2); + else + rs2 <= $unsigned(pcpi_rs2); + + rd <= 0; + rdx <= 0; + mul_counter <= (instr_any_mulh ? 63 - STEPS_AT_ONCE : 31 - STEPS_AT_ONCE); + mul_waiting <= !mul_start; + end else begin + rd <= next_rd; + rdx <= next_rdx; + rs1 <= next_rs1; + rs2 <= next_rs2; + + mul_counter <= mul_counter - STEPS_AT_ONCE; + if (mul_counter[6]) begin + mul_finish <= 1; + mul_waiting <= 1; + end + end + end + + always @(posedge clk) begin + pcpi_wr <= 0; + pcpi_ready <= 0; + if (mul_finish && resetn) begin + pcpi_wr <= 1; + pcpi_ready <= 1; + pcpi_rd <= instr_any_mulh ? rd >> 32 : rd; + end + end +endmodule + +module picorv32_pcpi_fast_mul #( + parameter EXTRA_MUL_FFS = 0, + parameter EXTRA_INSN_FFS = 0, + parameter MUL_CLKGATE = 0 +) ( + input clk, resetn, + + input pcpi_valid, + input [31:0] pcpi_insn, + input [31:0] pcpi_rs1, + input [31:0] pcpi_rs2, + output pcpi_wr, + output [31:0] pcpi_rd, + output pcpi_wait, + output pcpi_ready +); + reg instr_mul, instr_mulh, instr_mulhsu, instr_mulhu; + wire instr_any_mul = |{instr_mul, instr_mulh, instr_mulhsu, instr_mulhu}; + wire instr_any_mulh = |{instr_mulh, instr_mulhsu, instr_mulhu}; + wire instr_rs1_signed = |{instr_mulh, instr_mulhsu}; + wire instr_rs2_signed = |{instr_mulh}; + + reg shift_out; + reg [3:0] active; + reg [32:0] rs1, rs2, rs1_q, rs2_q; + reg [63:0] rd, rd_q; + + wire pcpi_insn_valid = pcpi_valid && pcpi_insn[6:0] == 7'b0110011 && pcpi_insn[31:25] == 7'b0000001; + reg pcpi_insn_valid_q; + + always @* begin + instr_mul = 0; + instr_mulh = 0; + instr_mulhsu = 0; + instr_mulhu = 0; + + if (resetn && (EXTRA_INSN_FFS ? pcpi_insn_valid_q : pcpi_insn_valid)) begin + case (pcpi_insn[14:12]) + 3'b000: instr_mul = 1; + 3'b001: instr_mulh = 1; + 3'b010: instr_mulhsu = 1; + 3'b011: instr_mulhu = 1; + endcase + end + end + + always @(posedge clk) begin + pcpi_insn_valid_q <= pcpi_insn_valid; + if (!MUL_CLKGATE || active[0]) begin + rs1_q <= rs1; + rs2_q <= rs2; + end + if (!MUL_CLKGATE || active[1]) begin + rd <= $signed(EXTRA_MUL_FFS ? rs1_q : rs1) * $signed(EXTRA_MUL_FFS ? rs2_q : rs2); + end + if (!MUL_CLKGATE || active[2]) begin + rd_q <= rd; + end + end + + always @(posedge clk) begin + if (instr_any_mul && !(EXTRA_MUL_FFS ? 
active[3:0] : active[1:0])) begin + if (instr_rs1_signed) + rs1 <= $signed(pcpi_rs1); + else + rs1 <= $unsigned(pcpi_rs1); + + if (instr_rs2_signed) + rs2 <= $signed(pcpi_rs2); + else + rs2 <= $unsigned(pcpi_rs2); + active[0] <= 1; + end else begin + active[0] <= 0; + end + + active[3:1] <= active; + shift_out <= instr_any_mulh; + + if (!resetn) + active <= 0; + end + + assign pcpi_wr = active[EXTRA_MUL_FFS ? 3 : 1]; + assign pcpi_wait = 0; + assign pcpi_ready = active[EXTRA_MUL_FFS ? 3 : 1]; +`ifdef RISCV_FORMAL_ALTOPS + assign pcpi_rd = + instr_mul ? (pcpi_rs1 + pcpi_rs2) ^ 32'h5876063e : + instr_mulh ? (pcpi_rs1 + pcpi_rs2) ^ 32'hf6583fb7 : + instr_mulhsu ? (pcpi_rs1 - pcpi_rs2) ^ 32'hecfbe137 : + instr_mulhu ? (pcpi_rs1 + pcpi_rs2) ^ 32'h949ce5e8 : 1'bx; +`else + assign pcpi_rd = shift_out ? (EXTRA_MUL_FFS ? rd_q : rd) >> 32 : (EXTRA_MUL_FFS ? rd_q : rd); +`endif +endmodule + + +/*************************************************************** + * picorv32_pcpi_div + ***************************************************************/ + +module picorv32_pcpi_div ( + input clk, resetn, + + input pcpi_valid, + input [31:0] pcpi_insn, + input [31:0] pcpi_rs1, + input [31:0] pcpi_rs2, + output reg pcpi_wr, + output reg [31:0] pcpi_rd, + output reg pcpi_wait, + output reg pcpi_ready +); + reg instr_div, instr_divu, instr_rem, instr_remu; + wire instr_any_div_rem = |{instr_div, instr_divu, instr_rem, instr_remu}; + + reg pcpi_wait_q; + wire start = pcpi_wait && !pcpi_wait_q; + + always @(posedge clk) begin + instr_div <= 0; + instr_divu <= 0; + instr_rem <= 0; + instr_remu <= 0; + + if (resetn && pcpi_valid && !pcpi_ready && pcpi_insn[6:0] == 7'b0110011 && pcpi_insn[31:25] == 7'b0000001) begin + case (pcpi_insn[14:12]) + 3'b100: instr_div <= 1; + 3'b101: instr_divu <= 1; + 3'b110: instr_rem <= 1; + 3'b111: instr_remu <= 1; + endcase + end + + pcpi_wait <= instr_any_div_rem && resetn; + pcpi_wait_q <= pcpi_wait && resetn; + end + + reg [31:0] dividend; + reg [62:0] divisor; + reg [31:0] quotient; + reg [31:0] quotient_msk; + reg running; + reg outsign; + + always @(posedge clk) begin + pcpi_ready <= 0; + pcpi_wr <= 0; + pcpi_rd <= 'bx; + + if (!resetn) begin + running <= 0; + end else + if (start) begin + running <= 1; + dividend <= (instr_div || instr_rem) && pcpi_rs1[31] ? -pcpi_rs1 : pcpi_rs1; + divisor <= ((instr_div || instr_rem) && pcpi_rs2[31] ? -pcpi_rs2 : pcpi_rs2) << 31; + outsign <= (instr_div && (pcpi_rs1[31] != pcpi_rs2[31]) && |pcpi_rs2) || (instr_rem && pcpi_rs1[31]); + quotient <= 0; + quotient_msk <= 1 << 31; + end else + if (!quotient_msk && running) begin + running <= 0; + pcpi_ready <= 1; + pcpi_wr <= 1; +`ifdef RISCV_FORMAL_ALTOPS + case (1) + instr_div: pcpi_rd <= (pcpi_rs1 - pcpi_rs2) ^ 32'h7f8529ec; + instr_divu: pcpi_rd <= (pcpi_rs1 - pcpi_rs2) ^ 32'h10e8fd70; + instr_rem: pcpi_rd <= (pcpi_rs1 - pcpi_rs2) ^ 32'h8da68fa5; + instr_remu: pcpi_rd <= (pcpi_rs1 - pcpi_rs2) ^ 32'h3138d0e1; + endcase +`else + if (instr_div || instr_divu) + pcpi_rd <= outsign ? -quotient : quotient; + else + pcpi_rd <= outsign ? 
-dividend : dividend; +`endif + end else begin + if (divisor <= dividend) begin + dividend <= dividend - divisor; + quotient <= quotient | quotient_msk; + end + divisor <= divisor >> 1; +`ifdef RISCV_FORMAL_ALTOPS + quotient_msk <= quotient_msk >> 5; +`else + quotient_msk <= quotient_msk >> 1; +`endif + end + end +endmodule + + +/*************************************************************** + * picorv32_axi + ***************************************************************/ + +module picorv32_axi #( + parameter [ 0:0] ENABLE_COUNTERS = 1, + parameter [ 0:0] ENABLE_COUNTERS64 = 1, + parameter [ 0:0] ENABLE_REGS_16_31 = 1, + parameter [ 0:0] ENABLE_REGS_DUALPORT = 1, + parameter [ 0:0] TWO_STAGE_SHIFT = 1, + parameter [ 0:0] BARREL_SHIFTER = 0, + parameter [ 0:0] TWO_CYCLE_COMPARE = 0, + parameter [ 0:0] TWO_CYCLE_ALU = 0, + parameter [ 0:0] COMPRESSED_ISA = 0, + parameter [ 0:0] CATCH_MISALIGN = 1, + parameter [ 0:0] CATCH_ILLINSN = 1, + parameter [ 0:0] ENABLE_PCPI = 0, + parameter [ 0:0] ENABLE_MUL = 0, + parameter [ 0:0] ENABLE_FAST_MUL = 0, + parameter [ 0:0] ENABLE_DIV = 0, + parameter [ 0:0] ENABLE_IRQ = 0, + parameter [ 0:0] ENABLE_IRQ_QREGS = 1, + parameter [ 0:0] ENABLE_IRQ_TIMER = 1, + parameter [ 0:0] ENABLE_TRACE = 0, + parameter [ 0:0] REGS_INIT_ZERO = 0, + parameter [31:0] MASKED_IRQ = 32'h 0000_0000, + parameter [31:0] LATCHED_IRQ = 32'h ffff_ffff, + parameter [31:0] PROGADDR_RESET = 32'h 0000_0000, + parameter [31:0] PROGADDR_IRQ = 32'h 0000_0010, + parameter [31:0] STACKADDR = 32'h ffff_ffff +) ( + input clk, resetn, + output trap, + + // AXI4-lite master memory interface + + output mem_axi_awvalid, + input mem_axi_awready, + output [31:0] mem_axi_awaddr, + output [ 2:0] mem_axi_awprot, + + output mem_axi_wvalid, + input mem_axi_wready, + output [31:0] mem_axi_wdata, + output [ 3:0] mem_axi_wstrb, + + input mem_axi_bvalid, + output mem_axi_bready, + + output mem_axi_arvalid, + input mem_axi_arready, + output [31:0] mem_axi_araddr, + output [ 2:0] mem_axi_arprot, + + input mem_axi_rvalid, + output mem_axi_rready, + input [31:0] mem_axi_rdata, + + // Pico Co-Processor Interface (PCPI) + output pcpi_valid, + output [31:0] pcpi_insn, + output [31:0] pcpi_rs1, + output [31:0] pcpi_rs2, + input pcpi_wr, + input [31:0] pcpi_rd, + input pcpi_wait, + input pcpi_ready, + + // IRQ interface + input [31:0] irq, + output [31:0] eoi, + +`ifdef RISCV_FORMAL + output rvfi_valid, + output [63:0] rvfi_order, + output [31:0] rvfi_insn, + output rvfi_trap, + output rvfi_halt, + output rvfi_intr, + output [ 4:0] rvfi_rs1_addr, + output [ 4:0] rvfi_rs2_addr, + output [31:0] rvfi_rs1_rdata, + output [31:0] rvfi_rs2_rdata, + output [ 4:0] rvfi_rd_addr, + output [31:0] rvfi_rd_wdata, + output [31:0] rvfi_pc_rdata, + output [31:0] rvfi_pc_wdata, + output [31:0] rvfi_mem_addr, + output [ 3:0] rvfi_mem_rmask, + output [ 3:0] rvfi_mem_wmask, + output [31:0] rvfi_mem_rdata, + output [31:0] rvfi_mem_wdata, +`endif + + // Trace Interface + output trace_valid, + output [35:0] trace_data +); + wire mem_valid; + wire [31:0] mem_addr; + wire [31:0] mem_wdata; + wire [ 3:0] mem_wstrb; + wire mem_instr; + wire mem_ready; + wire [31:0] mem_rdata; + + picorv32_axi_adapter axi_adapter ( + .clk (clk ), + .resetn (resetn ), + .mem_axi_awvalid(mem_axi_awvalid), + .mem_axi_awready(mem_axi_awready), + .mem_axi_awaddr (mem_axi_awaddr ), + .mem_axi_awprot (mem_axi_awprot ), + .mem_axi_wvalid (mem_axi_wvalid ), + .mem_axi_wready (mem_axi_wready ), + .mem_axi_wdata (mem_axi_wdata ), + .mem_axi_wstrb (mem_axi_wstrb ), + 
.mem_axi_bvalid (mem_axi_bvalid ), + .mem_axi_bready (mem_axi_bready ), + .mem_axi_arvalid(mem_axi_arvalid), + .mem_axi_arready(mem_axi_arready), + .mem_axi_araddr (mem_axi_araddr ), + .mem_axi_arprot (mem_axi_arprot ), + .mem_axi_rvalid (mem_axi_rvalid ), + .mem_axi_rready (mem_axi_rready ), + .mem_axi_rdata (mem_axi_rdata ), + .mem_valid (mem_valid ), + .mem_instr (mem_instr ), + .mem_ready (mem_ready ), + .mem_addr (mem_addr ), + .mem_wdata (mem_wdata ), + .mem_wstrb (mem_wstrb ), + .mem_rdata (mem_rdata ) + ); + + picorv32 #( + .ENABLE_COUNTERS (ENABLE_COUNTERS ), + .ENABLE_COUNTERS64 (ENABLE_COUNTERS64 ), + .ENABLE_REGS_16_31 (ENABLE_REGS_16_31 ), + .ENABLE_REGS_DUALPORT(ENABLE_REGS_DUALPORT), + .TWO_STAGE_SHIFT (TWO_STAGE_SHIFT ), + .BARREL_SHIFTER (BARREL_SHIFTER ), + .TWO_CYCLE_COMPARE (TWO_CYCLE_COMPARE ), + .TWO_CYCLE_ALU (TWO_CYCLE_ALU ), + .COMPRESSED_ISA (COMPRESSED_ISA ), + .CATCH_MISALIGN (CATCH_MISALIGN ), + .CATCH_ILLINSN (CATCH_ILLINSN ), + .ENABLE_PCPI (ENABLE_PCPI ), + .ENABLE_MUL (ENABLE_MUL ), + .ENABLE_FAST_MUL (ENABLE_FAST_MUL ), + .ENABLE_DIV (ENABLE_DIV ), + .ENABLE_IRQ (ENABLE_IRQ ), + .ENABLE_IRQ_QREGS (ENABLE_IRQ_QREGS ), + .ENABLE_IRQ_TIMER (ENABLE_IRQ_TIMER ), + .ENABLE_TRACE (ENABLE_TRACE ), + .REGS_INIT_ZERO (REGS_INIT_ZERO ), + .MASKED_IRQ (MASKED_IRQ ), + .LATCHED_IRQ (LATCHED_IRQ ), + .PROGADDR_RESET (PROGADDR_RESET ), + .PROGADDR_IRQ (PROGADDR_IRQ ), + .STACKADDR (STACKADDR ) + ) picorv32_core ( + .clk (clk ), + .resetn (resetn), + .trap (trap ), + + .mem_valid(mem_valid), + .mem_addr (mem_addr ), + .mem_wdata(mem_wdata), + .mem_wstrb(mem_wstrb), + .mem_instr(mem_instr), + .mem_ready(mem_ready), + .mem_rdata(mem_rdata), + + .pcpi_valid(pcpi_valid), + .pcpi_insn (pcpi_insn ), + .pcpi_rs1 (pcpi_rs1 ), + .pcpi_rs2 (pcpi_rs2 ), + .pcpi_wr (pcpi_wr ), + .pcpi_rd (pcpi_rd ), + .pcpi_wait (pcpi_wait ), + .pcpi_ready(pcpi_ready), + + .irq(irq), + .eoi(eoi), + +`ifdef RISCV_FORMAL + .rvfi_valid (rvfi_valid ), + .rvfi_order (rvfi_order ), + .rvfi_insn (rvfi_insn ), + .rvfi_trap (rvfi_trap ), + .rvfi_halt (rvfi_halt ), + .rvfi_intr (rvfi_intr ), + .rvfi_rs1_addr (rvfi_rs1_addr ), + .rvfi_rs2_addr (rvfi_rs2_addr ), + .rvfi_rs1_rdata(rvfi_rs1_rdata), + .rvfi_rs2_rdata(rvfi_rs2_rdata), + .rvfi_rd_addr (rvfi_rd_addr ), + .rvfi_rd_wdata (rvfi_rd_wdata ), + .rvfi_pc_rdata (rvfi_pc_rdata ), + .rvfi_pc_wdata (rvfi_pc_wdata ), + .rvfi_mem_addr (rvfi_mem_addr ), + .rvfi_mem_rmask(rvfi_mem_rmask), + .rvfi_mem_wmask(rvfi_mem_wmask), + .rvfi_mem_rdata(rvfi_mem_rdata), + .rvfi_mem_wdata(rvfi_mem_wdata), +`endif + + .trace_valid(trace_valid), + .trace_data (trace_data) + ); +endmodule + + +/*************************************************************** + * picorv32_axi_adapter + ***************************************************************/ + +module picorv32_axi_adapter ( + input clk, resetn, + + // AXI4-lite master memory interface + + output mem_axi_awvalid, + input mem_axi_awready, + output [31:0] mem_axi_awaddr, + output [ 2:0] mem_axi_awprot, + + output mem_axi_wvalid, + input mem_axi_wready, + output [31:0] mem_axi_wdata, + output [ 3:0] mem_axi_wstrb, + + input mem_axi_bvalid, + output mem_axi_bready, + + output mem_axi_arvalid, + input mem_axi_arready, + output [31:0] mem_axi_araddr, + output [ 2:0] mem_axi_arprot, + + input mem_axi_rvalid, + output mem_axi_rready, + input [31:0] mem_axi_rdata, + + // Native PicoRV32 memory interface + + input mem_valid, + input mem_instr, + output mem_ready, + input [31:0] mem_addr, + input [31:0] mem_wdata, + input [ 3:0] 
mem_wstrb, + output [31:0] mem_rdata +); + reg ack_awvalid; + reg ack_arvalid; + reg ack_wvalid; + reg xfer_done; + + assign mem_axi_awvalid = mem_valid && |mem_wstrb && !ack_awvalid; + assign mem_axi_awaddr = mem_addr; + assign mem_axi_awprot = 0; + + assign mem_axi_arvalid = mem_valid && !mem_wstrb && !ack_arvalid; + assign mem_axi_araddr = mem_addr; + assign mem_axi_arprot = mem_instr ? 3'b100 : 3'b000; + + assign mem_axi_wvalid = mem_valid && |mem_wstrb && !ack_wvalid; + assign mem_axi_wdata = mem_wdata; + assign mem_axi_wstrb = mem_wstrb; + + assign mem_ready = mem_axi_bvalid || mem_axi_rvalid; + assign mem_axi_bready = mem_valid && |mem_wstrb; + assign mem_axi_rready = mem_valid && !mem_wstrb; + assign mem_rdata = mem_axi_rdata; + + always @(posedge clk) begin + if (!resetn) begin + ack_awvalid <= 0; + end else begin + xfer_done <= mem_valid && mem_ready; + if (mem_axi_awready && mem_axi_awvalid) + ack_awvalid <= 1; + if (mem_axi_arready && mem_axi_arvalid) + ack_arvalid <= 1; + if (mem_axi_wready && mem_axi_wvalid) + ack_wvalid <= 1; + if (xfer_done || !mem_valid) begin + ack_awvalid <= 0; + ack_arvalid <= 0; + ack_wvalid <= 0; + end + end + end +endmodule + + +/*************************************************************** + * picorv32_wb + ***************************************************************/ + +module picorv32_wb #( + parameter [ 0:0] ENABLE_COUNTERS = 1, + parameter [ 0:0] ENABLE_COUNTERS64 = 1, + parameter [ 0:0] ENABLE_REGS_16_31 = 1, + parameter [ 0:0] ENABLE_REGS_DUALPORT = 1, + parameter [ 0:0] TWO_STAGE_SHIFT = 1, + parameter [ 0:0] BARREL_SHIFTER = 0, + parameter [ 0:0] TWO_CYCLE_COMPARE = 0, + parameter [ 0:0] TWO_CYCLE_ALU = 0, + parameter [ 0:0] COMPRESSED_ISA = 0, + parameter [ 0:0] CATCH_MISALIGN = 1, + parameter [ 0:0] CATCH_ILLINSN = 1, + parameter [ 0:0] ENABLE_PCPI = 0, + parameter [ 0:0] ENABLE_MUL = 0, + parameter [ 0:0] ENABLE_FAST_MUL = 0, + parameter [ 0:0] ENABLE_DIV = 0, + parameter [ 0:0] ENABLE_IRQ = 0, + parameter [ 0:0] ENABLE_IRQ_QREGS = 1, + parameter [ 0:0] ENABLE_IRQ_TIMER = 1, + parameter [ 0:0] ENABLE_TRACE = 0, + parameter [ 0:0] REGS_INIT_ZERO = 0, + parameter [31:0] MASKED_IRQ = 32'h 0000_0000, + parameter [31:0] LATCHED_IRQ = 32'h ffff_ffff, + parameter [31:0] PROGADDR_RESET = 32'h 0000_0000, + parameter [31:0] PROGADDR_IRQ = 32'h 0000_0010, + parameter [31:0] STACKADDR = 32'h ffff_ffff +) ( + output trap, + + // Wishbone interfaces + input wb_rst_i, + input wb_clk_i, + + output reg [31:0] wbm_adr_o, + output reg [31:0] wbm_dat_o, + input [31:0] wbm_dat_i, + output reg wbm_we_o, + output reg [3:0] wbm_sel_o, + output reg wbm_stb_o, + input wbm_ack_i, + output reg wbm_cyc_o, + + // Pico Co-Processor Interface (PCPI) + output pcpi_valid, + output [31:0] pcpi_insn, + output [31:0] pcpi_rs1, + output [31:0] pcpi_rs2, + input pcpi_wr, + input [31:0] pcpi_rd, + input pcpi_wait, + input pcpi_ready, + + // IRQ interface + input [31:0] irq, + output [31:0] eoi, + +`ifdef RISCV_FORMAL + output rvfi_valid, + output [63:0] rvfi_order, + output [31:0] rvfi_insn, + output rvfi_trap, + output rvfi_halt, + output rvfi_intr, + output [ 4:0] rvfi_rs1_addr, + output [ 4:0] rvfi_rs2_addr, + output [31:0] rvfi_rs1_rdata, + output [31:0] rvfi_rs2_rdata, + output [ 4:0] rvfi_rd_addr, + output [31:0] rvfi_rd_wdata, + output [31:0] rvfi_pc_rdata, + output [31:0] rvfi_pc_wdata, + output [31:0] rvfi_mem_addr, + output [ 3:0] rvfi_mem_rmask, + output [ 3:0] rvfi_mem_wmask, + output [31:0] rvfi_mem_rdata, + output [31:0] rvfi_mem_wdata, +`endif + + // Trace 
Interface + output trace_valid, + output [35:0] trace_data, + + output mem_instr +); + wire mem_valid; + wire [31:0] mem_addr; + wire [31:0] mem_wdata; + wire [ 3:0] mem_wstrb; + reg mem_ready; + reg [31:0] mem_rdata; + + wire clk; + wire resetn; + + assign clk = wb_clk_i; + assign resetn = ~wb_rst_i; + + picorv32 #( + .ENABLE_COUNTERS (ENABLE_COUNTERS ), + .ENABLE_COUNTERS64 (ENABLE_COUNTERS64 ), + .ENABLE_REGS_16_31 (ENABLE_REGS_16_31 ), + .ENABLE_REGS_DUALPORT(ENABLE_REGS_DUALPORT), + .TWO_STAGE_SHIFT (TWO_STAGE_SHIFT ), + .BARREL_SHIFTER (BARREL_SHIFTER ), + .TWO_CYCLE_COMPARE (TWO_CYCLE_COMPARE ), + .TWO_CYCLE_ALU (TWO_CYCLE_ALU ), + .COMPRESSED_ISA (COMPRESSED_ISA ), + .CATCH_MISALIGN (CATCH_MISALIGN ), + .CATCH_ILLINSN (CATCH_ILLINSN ), + .ENABLE_PCPI (ENABLE_PCPI ), + .ENABLE_MUL (ENABLE_MUL ), + .ENABLE_FAST_MUL (ENABLE_FAST_MUL ), + .ENABLE_DIV (ENABLE_DIV ), + .ENABLE_IRQ (ENABLE_IRQ ), + .ENABLE_IRQ_QREGS (ENABLE_IRQ_QREGS ), + .ENABLE_IRQ_TIMER (ENABLE_IRQ_TIMER ), + .ENABLE_TRACE (ENABLE_TRACE ), + .REGS_INIT_ZERO (REGS_INIT_ZERO ), + .MASKED_IRQ (MASKED_IRQ ), + .LATCHED_IRQ (LATCHED_IRQ ), + .PROGADDR_RESET (PROGADDR_RESET ), + .PROGADDR_IRQ (PROGADDR_IRQ ), + .STACKADDR (STACKADDR ) + ) picorv32_core ( + .clk (clk ), + .resetn (resetn), + .trap (trap ), + + .mem_valid(mem_valid), + .mem_addr (mem_addr ), + .mem_wdata(mem_wdata), + .mem_wstrb(mem_wstrb), + .mem_instr(mem_instr), + .mem_ready(mem_ready), + .mem_rdata(mem_rdata), + + .pcpi_valid(pcpi_valid), + .pcpi_insn (pcpi_insn ), + .pcpi_rs1 (pcpi_rs1 ), + .pcpi_rs2 (pcpi_rs2 ), + .pcpi_wr (pcpi_wr ), + .pcpi_rd (pcpi_rd ), + .pcpi_wait (pcpi_wait ), + .pcpi_ready(pcpi_ready), + + .irq(irq), + .eoi(eoi), + +`ifdef RISCV_FORMAL + .rvfi_valid (rvfi_valid ), + .rvfi_order (rvfi_order ), + .rvfi_insn (rvfi_insn ), + .rvfi_trap (rvfi_trap ), + .rvfi_halt (rvfi_halt ), + .rvfi_intr (rvfi_intr ), + .rvfi_rs1_addr (rvfi_rs1_addr ), + .rvfi_rs2_addr (rvfi_rs2_addr ), + .rvfi_rs1_rdata(rvfi_rs1_rdata), + .rvfi_rs2_rdata(rvfi_rs2_rdata), + .rvfi_rd_addr (rvfi_rd_addr ), + .rvfi_rd_wdata (rvfi_rd_wdata ), + .rvfi_pc_rdata (rvfi_pc_rdata ), + .rvfi_pc_wdata (rvfi_pc_wdata ), + .rvfi_mem_addr (rvfi_mem_addr ), + .rvfi_mem_rmask(rvfi_mem_rmask), + .rvfi_mem_wmask(rvfi_mem_wmask), + .rvfi_mem_rdata(rvfi_mem_rdata), + .rvfi_mem_wdata(rvfi_mem_wdata), +`endif + + .trace_valid(trace_valid), + .trace_data (trace_data) + ); + + localparam IDLE = 2'b00; + localparam WBSTART = 2'b01; + localparam WBEND = 2'b10; + + reg [1:0] state; + + wire we; + assign we = (mem_wstrb[0] | mem_wstrb[1] | mem_wstrb[2] | mem_wstrb[3]); + + always @(posedge wb_clk_i) begin + if (wb_rst_i) begin + wbm_adr_o <= 0; + wbm_dat_o <= 0; + wbm_we_o <= 0; + wbm_sel_o <= 0; + wbm_stb_o <= 0; + wbm_cyc_o <= 0; + state <= IDLE; + end else begin + case (state) + IDLE: begin + if (mem_valid) begin + wbm_adr_o <= mem_addr; + wbm_dat_o <= mem_wdata; + wbm_we_o <= we; + wbm_sel_o <= mem_wstrb; + + wbm_stb_o <= 1'b1; + wbm_cyc_o <= 1'b1; + state <= WBSTART; + end else begin + mem_ready <= 1'b0; + + wbm_stb_o <= 1'b0; + wbm_cyc_o <= 1'b0; + wbm_we_o <= 1'b0; + end + end + WBSTART:begin + if (wbm_ack_i) begin + mem_rdata <= wbm_dat_i; + mem_ready <= 1'b1; + + state <= WBEND; + + wbm_stb_o <= 1'b0; + wbm_cyc_o <= 1'b0; + wbm_we_o <= 1'b0; + end + end + WBEND: begin + mem_ready <= 1'b0; + + state <= IDLE; + end + default: + state <= IDLE; + endcase + end + end +endmodule diff --git a/experiments/timfuz/pip_unique.py b/experiments/timfuz/pip_unique.py new file mode 100644 index 
00000000..39b45d44
--- /dev/null
+++ b/experiments/timfuz/pip_unique.py
@@ -0,0 +1,89 @@
+'''
+Verifies that pip timing info is unique: pips with the same name should
+carry the same timing-related properties in every tile
+'''
+
+import re
+
+def gen_wires(fin):
+    for l in fin:
+        lj = {}
+        l = l.strip()
+        for kvs in l.split():
+            name, value = kvs.split(':')
+            lj[name] = value
+
+        tile_type, xy, wname = re.match(r'(.*)_(X[0-9]*Y[0-9]*)/(.*)', lj['NAME']).groups()
+        lj['tile_type'] = tile_type
+        lj['xy'] = xy
+        lj['wname'] = wname
+
+        lj['l'] = l
+
+        yield lj
+
+def run(node_fin, verbose=0):
+    refnodes = {}
+    for nodei, anode in enumerate(gen_wires(node_fin)):
+        def getk(anode):
+            # Alternative, stricter key: (anode['tile_type'], anode['wname'])
+            return anode['wname']
+
+        if nodei % 1000 == 0:
+            print('Check pip %d' % nodei)
+        # Existing entry?
+        try:
+            refnode = refnodes[getk(anode)]
+        except KeyError:
+            # Set as reference
+            refnodes[getk(anode)] = anode
+            continue
+        k_invariant = (
+            'CAN_INVERT',
+            'IS_BUFFERED_2_0',
+            'IS_BUFFERED_2_1',
+            'IS_DIRECTIONAL',
+            'IS_EXCLUDED_PIP',
+            'IS_FIXED_INVERSION',
+            'IS_INVERTED',
+            'IS_PSEUDO',
+            'IS_SITE_PIP',
+            'IS_TEST_PIP',
+        )
+        k_varies = (
+            'TILE',
+        )
+        # Verify equivalence
+        for k in k_invariant:
+            if k in refnode and k in anode:
+                def fail():
+                    print('Mismatch on %s' % k)
+                    print('%s %s' % (refnode[k], anode[k]))
+                    print(refnode['l'])
+                    print(anode['l'])
+                    #assert 0
+                if refnode[k] != anode[k]:
+                    print('')
+                    fail()
+            # A key in one but not the other?
+            elif k in refnode or k in anode:
+                assert 0
+            elif k not in k_varies:
+                assert 0
+
+if __name__ == '__main__':
+    import argparse
+
+    parser = argparse.ArgumentParser(description='Timing fuzzer')
+
+    parser.add_argument('--verbose', type=int, help='')
+    parser.add_argument(
+        'node_fn_in',
+        default='/dev/stdin',
+        nargs='?',
+        help='Input file')
+    args = parser.parse_args()
+    run(open(args.node_fn_in, 'r'), verbose=args.verbose)
diff --git a/experiments/timfuz/placelut.py b/experiments/timfuz/placelut.py
new file mode 100644
index 00000000..47dd9e3c
--- /dev/null
+++ b/experiments/timfuz/placelut.py
@@ -0,0 +1,91 @@
+#!/usr/bin/env python
+
+import argparse
+
+parser = argparse.ArgumentParser(description='')
+parser.add_argument('--sdx', default='8', help='')
+parser.add_argument('--sdy', default='4', help='')
+args = parser.parse_args()
+
+'''
+Generate in pairs
+Fill up switchbox quad for now
+Create random connections between the LUTs
+See how much routing pressure we can generate
+
+Start with non-random connections to the LFSR for solver comparison
+
+Start at SLICE_X16Y102
+'''
+SBASE = (16, 102)
+SDX = int(args.sdx, 0)
+SDY = int(args.sdy, 0)
+nlut = 4 * SDX * SDY
+
+nin = 6 * nlut
+nout = nlut
+
+print('//placelut simple')
+print('//SBASE: %s' % (SBASE,))
+print('//SDX: %s' % (SDX,))
+print('//SDY: %s' % (SDY,))
+print('//nlut: %s' % (nlut,))
+print('''\
+module roi (
+        input wire clk,
+        input wire [%u:0] ins,
+        output wire [%u:0] outs);''' % (nin - 1, nout - 1))
+
+ini = 0
+outi = 0
+for lutx in xrange(SBASE[0], SBASE[0] + SDX):
+    for luty in xrange(SBASE[1], SBASE[1] + SDY):
+        loc = "SLICE_X%uY%u" % (lutx, luty)
+        for belc in 'ABCD':
+            bel = '%c6LUT' % belc
+            print('''\
+
+    (* KEEP, DONT_TOUCH, LOC="%s", BEL="%s" *)
+    LUT6 #(
+        .INIT(64'hBAD1DEA_1DEADCE0)
+    ) %s (''' % (loc, bel, 'lut_x%uy%u_%c' % (lutx, luty, belc)))
+            for i in xrange(6):
+                print('''\
+        .I%u(ins[%u]),''' % (i, ini))
+                ini += 1
+            print('''\
+        .O(outs[%u]));''' % (outi,))
+            outi += 1
+assert nin == ini
+assert nout == outi
+
+print('''
+endmodule
+
+module top(input wire clk, input wire stb, input wire di, output wire do);
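+    // Serial access harness: input bits shift in through di into din_shr,
+    // stb latches din_shr into din and captures dout into dout_shr, and
+    // dout_shr shifts back out through do, so the wide ROI ports only
+    // need four physical pins.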
+    localparam integer DIN_N = %u;
+    localparam integer DOUT_N = %u;
+
+    reg [DIN_N-1:0] din;
+    wire [DOUT_N-1:0] dout;
+
+    reg [DIN_N-1:0] din_shr;
+    reg [DOUT_N-1:0] dout_shr;
+
+    always @(posedge clk) begin
+        din_shr <= {din_shr, di};
+        dout_shr <= {dout_shr, din_shr[DIN_N-1]};
+        if (stb) begin
+            din <= din_shr;
+            dout_shr <= dout;
+        end
+    end
+
+    assign do = dout_shr[DOUT_N-1];
+    roi roi(
+        .clk(clk),
+        .ins(din),
+        .outs(dout)
+    );
+endmodule''' % (nin, nout))
+
diff --git a/experiments/timfuz/placelut_fb.py b/experiments/timfuz/placelut_fb.py
new file mode 100644
index 00000000..7e973da0
--- /dev/null
+++ b/experiments/timfuz/placelut_fb.py
@@ -0,0 +1,103 @@
+#!/usr/bin/env python
+
+'''
+Note: Vivado will (by default) fail bitgen DRC on LUT feedback loops.
+It looks like this can probably be disabled, but we don't actually need a bitstream for timing analysis.
+'''
+
+import argparse
+import random
+
+random.seed()
+
+parser = argparse.ArgumentParser(description='')
+parser.add_argument('--sdx', default='8', help='')
+parser.add_argument('--sdy', default='4', help='')
+args = parser.parse_args()
+
+'''
+Generate in pairs
+Fill up switchbox quad for now
+Create random connections between the LUTs
+See how much routing pressure we can generate
+
+Start with non-random connections to the LFSR for solver comparison
+
+Start at SLICE_X16Y102
+'''
+SBASE = (16, 102)
+SDX = int(args.sdx, 0)
+SDY = int(args.sdy, 0)
+nlut = 4 * SDX * SDY
+
+nin = 6 * nlut
+nout = nlut
+
+print('//placelut w/ feedback')
+print('//SBASE: %s' % (SBASE,))
+print('//SDX: %s' % (SDX,))
+print('//SDY: %s' % (SDY,))
+print('//nlut: %s' % (nlut,))
+print('''\
+module roi (
+        input wire clk,
+        input wire [%u:0] ins,
+        output wire [%u:0] outs);''' % (nin - 1, nout - 1))
+
+ini = 0
+outi = 0
+for lutx in xrange(SBASE[0], SBASE[0] + SDX):
+    for luty in xrange(SBASE[1], SBASE[1] + SDY):
+        loc = "SLICE_X%uY%u" % (lutx, luty)
+        for belc in 'ABCD':
+            bel = '%c6LUT' % belc
+            print('''\
+
+    (* KEEP, DONT_TOUCH, LOC="%s", BEL="%s" *)
+    LUT6 #(
+        .INIT(64'hBAD1DEA_1DEADCE0)
+    ) %s (''' % (loc, bel, 'lut_x%uy%u_%c' % (lutx, luty, belc)))
+            for i in xrange(6):
+                if random.randint(0, 9) < 1:
+                    wfrom = 'ins[%u]' % ini
+                    ini += 1
+                else:
+                    wfrom = 'outs[%u]' % random.randint(0, nout - 1)
+                print('''\
+        .I%u(%s),''' % (i, wfrom))
+            print('''\
+        .O(outs[%u]));''' % (outi,))
+            outi += 1
+# Not all inputs are consumed when feedback is chosen
+#assert nin == ini
+assert nout == outi
+
+print('''
+endmodule
+
+module top(input wire clk, input wire stb, input wire di, output wire do);
+    localparam integer DIN_N = %u;
+    localparam integer DOUT_N = %u;
+
+    reg [DIN_N-1:0] din;
+    wire [DOUT_N-1:0] dout;
+
+    reg [DIN_N-1:0] din_shr;
+    reg [DOUT_N-1:0] dout_shr;
+
+    always @(posedge clk) begin
+        din_shr <= {din_shr, di};
+        dout_shr <= {dout_shr, din_shr[DIN_N-1]};
+        if (stb) begin
+            din <= din_shr;
+            dout_shr <= dout;
+        end
+    end
+
+    assign do = dout_shr[DOUT_N-1];
+    roi roi(
+        .clk(clk),
+        .ins(din),
+        .outs(dout)
+    );
+endmodule''' % (nin, nout))
+
diff --git a/experiments/timfuz/placelut_ff_fb.py b/experiments/timfuz/placelut_ff_fb.py
new file mode 100644
index 00000000..3f8b2784
--- /dev/null
+++ b/experiments/timfuz/placelut_ff_fb.py
@@ -0,0 +1,126 @@
+#!/usr/bin/env python
+
+'''
+Note: Vivado will (by default) fail bitgen DRC on LUT feedback loops.
+It looks like this can probably be disabled, but we don't actually need a bitstream for timing analysis.
+
+ERROR: [Vivado 12-2285] Cannot set LOC property of instance 'roi/lut_x22y102_D', Instance roi/lut_x22y102_D can not be placed in D6LUT of site SLICE_X18Y103 because the bel is occupied by roi/lut_x18y103_D(port:). This could be caused by bel constraint conflict
+Resolution: When using BEL constraints, ensure the BEL constraints are defined before the LOC constraints to avoid conflicts at a given site.
+
+'''
+
+import argparse
+import random
+
+random.seed()
+
+parser = argparse.ArgumentParser(description='')
+parser.add_argument('--sdx', default='8', help='')
+parser.add_argument('--sdy', default='4', help='')
+args = parser.parse_args()
+
+'''
+Generate in pairs
+Fill up switchbox quad for now
+Create random connections between the LUTs
+See how much routing pressure we can generate
+
+Start with non-random connections to the LFSR for solver comparison
+
+Start at SLICE_X16Y102
+'''
+SBASE = (16, 102)
+SDX = int(args.sdx, 0)
+SDY = int(args.sdy, 0)
+nlut = 4 * SDX * SDY
+
+nin = 6 * nlut
+nout = nlut
+
+print('//placelut w/ FF + feedback')
+print('//SBASE: %s' % (SBASE,))
+print('//SDX: %s' % (SDX,))
+print('//SDY: %s' % (SDY,))
+print('//nlut: %s' % (nlut,))
+print('''\
+module roi (
+        input wire clk,
+        input wire [%u:0] ins,
+        output wire [%u:0] outs);''' % (nin - 1, nout - 1))
+
+ini = 0
+outi = 0
+for lutx in xrange(SBASE[0], SBASE[0] + SDX):
+    for luty in xrange(SBASE[1], SBASE[1] + SDY):
+        loc = "SLICE_X%uY%u" % (lutx, luty)
+        for belc in 'ABCD':
+            bel = '%c6LUT' % belc
+            name = 'lut_x%uy%u_%c' % (lutx, luty, belc)
+            print('''\
+
+    (* KEEP, DONT_TOUCH, LOC="%s", BEL="%s" *)
+    LUT6 #(
+        .INIT(64'hBAD1DEA_1DEADCE0)
+    ) %s (''' % (loc, bel, name))
+            for i in xrange(6):
+                rval = random.randint(0, 9)
+                if rval < 3:
+                    wfrom = 'ins[%u]' % ini
+                    ini += 1
+                #elif rval < 6:
+                #    wfrom = 'outsr[%u]' % random.randint(0, nout - 1)
+                else:
+                    wfrom = 'outs[%u]' % random.randint(0, nout - 1)
+                print('''\
+        .I%u(%s),''' % (i, wfrom))
+            out_w = name + '_o'
+            print('''\
+        .O(%s));''' % (out_w,))
+
+            outs_w = "outs[%u]" % outi
+            if random.randint(0, 9) < 5:
+                print('    assign %s = %s;' % (outs_w, out_w))
+            else:
+                out_r = name + '_or'
+                print('''\
+    reg %s;
+    assign %s = %s;
+    always @(posedge clk) begin
+        %s <= %s;
+    end
+''' % (out_r, outs_w, out_r, out_r, out_w))
+            outi += 1
+
+# Not all inputs are consumed when feedback is chosen
+#assert nin == ini
+assert nout == outi
+
+print('''
+endmodule
+
+module top(input wire clk, input wire stb, input wire di, output wire do);
+    localparam integer DIN_N = %u;
+    localparam integer DOUT_N = %u;
+
+    reg [DIN_N-1:0] din;
+    wire [DOUT_N-1:0] dout;
+
+    reg [DIN_N-1:0] din_shr;
+    reg [DOUT_N-1:0] dout_shr;
+
+    always @(posedge clk) begin
+        din_shr <= {din_shr, di};
+        dout_shr <= {dout_shr, din_shr[DIN_N-1]};
+        if (stb) begin
+            din <= din_shr;
+            dout_shr <= dout;
+        end
+    end
+
+    assign do = dout_shr[DOUT_N-1];
+    roi roi(
+        .clk(clk),
+        .ins(din),
+        .outs(dout)
+    );
+endmodule''' % (nin, nout))
+
diff --git a/experiments/timfuz/speed.sh b/experiments/timfuz/speed.sh
new file mode 100755
index 00000000..0712c64f
--- /dev/null
+++ b/experiments/timfuz/speed.sh
@@ -0,0 +1,8 @@
+#!/usr/bin/env bash
+set -ex
+
+mkdir -p build_speed
+cd build_speed
+vivado -mode batch -source ../speed.tcl
+python ../speed_json.py speed_model.txt node.txt speed.json
+
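+# speed_model.txt is written by speed_models2 and node.txt by
+# nodes_unique_cc (both defined in speed.tcl); speed_json.py merges
+# them into speed.json for the downstream timfuz scripts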
-of_objects $pin] + set bel [get_bels -of_objects $cell] + return $bel +} + +proc build_design_full {} { + create_project -force -part $::env(XRAY_PART) design design + read_verilog ../top.v + read_verilog ../picorv32.v + synth_design -top top + + set_property LOCK_PINS {I0:A1 I1:A2 I2:A3 I3:A4 I4:A5 I5:A6} \ + [get_cells -quiet -filter {REF_NAME == LUT6} -hierarchical] + + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_00) IOSTANDARD LVCMOS33" [get_ports clk] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_01) IOSTANDARD LVCMOS33" [get_ports stb] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_02) IOSTANDARD LVCMOS33" [get_ports di] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_03) IOSTANDARD LVCMOS33" [get_ports do] + + create_pblock roi + set roipb [get_pblocks roi] + set_property EXCLUDE_PLACEMENT 1 $roipb + add_cells_to_pblock $roipb [get_cells roi] + resize_pblock $roipb -add "$::env(XRAY_ROI)" + + randplace_pblock 150 $roipb + set_property CFGBVS VCCO [current_design] + set_property CONFIG_VOLTAGE 3.3 [current_design] + set_property BITSTREAM.GENERAL.PERFRAMECRC YES [current_design] + + set_property CLOCK_DEDICATED_ROUTE FALSE [get_nets clk_IBUF] + + place_design + route_design + + write_checkpoint -force design.dcp + write_bitstream -force design.bit +} + + +proc build_design_synth {} { + create_project -force -part $::env(XRAY_PART) design design + + read_verilog ../top.v + read_verilog ../picorv32.v + synth_design -top top +} + +# WARNING: [Common 17-673] Cannot get value of property 'FORWARD' because this property is not valid in conjunction with other property setting on this object. +# WARNING: [Common 17-673] Cannot get value of property 'REVERSE' because this property is not valid in conjunction with other property setting on this object. +proc speed_models1 {} { + set outdir "." + set fp [open "$outdir/speed_model.txt" w] + # list_property [lindex [get_speed_models] 0] + set speed_models [get_speed_models] + set properties [list_property [lindex $speed_models 0]] + # "CLASS DELAY FAST_MAX FAST_MIN IS_INSTANCE_SPECIFIC NAME NAME_LOGICAL SLOW_MAX SLOW_MIN SPEED_INDEX TYPE" + puts $fp $properties + + set needspace 0 + foreach speed_model $speed_models { + foreach property $properties { + if $needspace { + puts -nonewline $fp " " + } + puts -nonewline $fp [get_property $property $speed_model] + set needspace 1 + } + puts $fp "" + } + close $fp +} + +proc speed_models2 {} { + set outdir "." + set fp [open "$outdir/speed_model.txt" w] + # list_property [lindex [get_speed_models] 0] + set speed_models [get_speed_models] + puts "Items: [llength $speed_models]" + + set needspace 0 + # Not all objects have the same properties + # But they do seem to have the same list + set properties [list_property [lindex $speed_models 0]] + foreach speed_model $speed_models { + set needspace 0 + foreach property $properties { + set val [get_property $property $speed_model] + if {"$val" ne ""} { + if $needspace { + puts -nonewline $fp " " + } + puts -nonewline $fp "$property:$val" + set needspace 1 + } + } + puts $fp "" + } + close $fp +} + + +# For cost codes +# Items: 2663055s +# Hmm too much +# Lets filter out items we really want +proc nodes_all {} { + set outdir "." 
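
These dump procs write one record per object as space-separated PROPERTY:VALUE pairs into speed_model.txt / node.txt. A minimal python3 sketch of reading one such record back (parse_record and the sample line are invented for illustration, not part of the patch; maxsplit=1 tolerates values containing ':'):

    def parse_record(line):
        '''Parse a "PROP:VAL PROP:VAL ..." record from speed_model.txt/node.txt.'''
        ret = {}
        for kv in line.split():
            prop, val = kv.split(':', 1)
            ret[prop.lower()] = val
        return ret

    # parse_record('NAME:BSW_ZERO SPEED_INDEX:65535')
    # -> {'name': 'BSW_ZERO', 'speed_index': '65535'}
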
+    set fp [open "$outdir/node_all.txt" w]
+    set items [get_nodes]
+    puts "Items: [llength $items]"
+
+    set needspace 0
+    set properties [list_property [lindex $items 0]]
+    foreach item $items {
+        set needspace 0
+        foreach property $properties {
+            set val [get_property $property $item]
+            if {"$val" ne ""} {
+                if $needspace {
+                    puts -nonewline $fp " "
+                }
+                puts -nonewline $fp "$property:$val"
+                set needspace 1
+            }
+        }
+        puts $fp ""
+    }
+    close $fp
+}
+
+# Only writes out items with unique cost codes
+# (much faster)
+proc nodes_unique_cc {} {
+    set outdir "."
+    set fp [open "$outdir/node.txt" w]
+    set items [get_nodes]
+    puts "Items: [llength $items]"
+
+    set needspace 0
+    set properties [list_property [lindex $items 0]]
+    set cost_codes_known [dict create]
+    set itemi 0
+    foreach item $items {
+        incr itemi
+        set cost_code [get_property COST_CODE $item]
+        if {[ dict exists $cost_codes_known $cost_code ]} {
+            continue
+        }
+        puts "Adding $cost_code @ item $itemi"
+        dict set cost_codes_known $cost_code 1
+
+        set needspace 0
+        foreach property $properties {
+            set val [get_property $property $item]
+            if {"$val" ne ""} {
+                if $needspace {
+                    puts -nonewline $fp " "
+                }
+                puts -nonewline $fp "$property:$val"
+                set needspace 1
+            }
+        }
+        puts $fp ""
+    }
+    close $fp
+}
+
+build_design_full
+speed_models2
+nodes_unique_cc
+
diff --git a/experiments/timfuz/speed_json.py b/experiments/timfuz/speed_json.py
new file mode 100644
index 00000000..07dfd20b
--- /dev/null
+++ b/experiments/timfuz/speed_json.py
@@ -0,0 +1,98 @@
+import json
+
+def load_speed(fin):
+    speed_models = {}
+    speed_types = {}
+    for l in fin:
+        delay = {}
+        l = l.strip()
+        for kvs in l.split():
+            name, value = kvs.split(':')
+            name = name.lower()
+            if name in ('class',):
+                continue
+            if name in ('speed_index',):
+                value = int(value)
+            if name == 'type':
+                speed_types.setdefault(value, {})
+            delay[name] = value
+        delayk = delay['name']
+        # Check against the models collected so far, not the entry itself
+        if delayk in speed_models:
+            raise Exception("Duplicate name")
+
+        if "name" in delay and "name_logical" in delay:
+            # Always true
+            if delay['name'] != delay['name_logical']:
+                raise Exception("nope!")
+            # Found a counter example
+            if 0 and delay['name'] != delay['forward']:
+                # ('BSW_NONTLFW_TLRV', '_BSW_LONG_NONTLFORWARD')
+                print(delay['name'], delay['forward'])
+                raise Exception("nope!")
+            # Found a counter example
+            if 0 and delay['forward'] != delay['reverse']:
+                # _BSW_LONG_NONTLFORWARD _BSW_LONG_TLREVERSE
+                print(delay['forward'], delay['reverse'])
+                raise Exception("nope!")
+
+        speed_models[delayk] = delay
+    return speed_models, speed_types
+
+def load_cost_code(fin):
+    # COST_CODE:4 COST_CODE_NAME:SLOWSINGLE
+    cost_codes = {}
+    for l in fin:
+        lj = {}
+        l = l.strip()
+        for kvs in l.split():
+            name, value = kvs.split(':')
+            name = name.lower()
+            lj[name] = value
+        cost_code = {
+            'name': lj['cost_code_name'],
+            'code': int(lj['cost_code']),
+            # Hmm is this unique per type?
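
For orientation, the JSON this script eventually emits (see run() below) has three top-level sections. A minimal invented example of the layout; the concrete names and values here are illustrative only:

    example = {
        'speed_model': {
            'BSW_ZERO': {'name': 'BSW_ZERO', 'speed_index': 0, 'type': 'BSW'},
        },
        'speed_type': {'BSW': {}},
        'cost_code': {'SLOWSINGLE': {'name': 'SLOWSINGLE', 'code': 4}},
    }
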
+ #'speed_class': int(lj['speed_class']), + } + + cost_codes[cost_code['name']] = cost_code + return cost_codes + +def run(speed_fin, node_fin, fout, verbose=0): + print('Loading data') + speed_models, speed_types = load_speed(speed_fin) + cost_codes = load_cost_code(node_fin) + + j = { + 'speed_model': speed_models, + 'speed_type': speed_types, + 'cost_code': cost_codes, + } + json.dump(j, fout, sort_keys=True, indent=4, separators=(',', ': ')) + +if __name__ == '__main__': + import argparse + + parser = argparse.ArgumentParser( + description= + 'Timing fuzzer' + ) + + parser.add_argument('--verbose', type=int, help='') + parser.add_argument( + 'speed_fn_in', + default='/dev/stdin', + nargs='?', + help='Input file') + parser.add_argument( + 'node_fn_in', + default='/dev/stdin', + nargs='?', + help='Input file') + parser.add_argument( + 'fn_out', + default='/dev/stdout', + nargs='?', + help='Output file') + args = parser.parse_args() + run(open(args.speed_fn_in, 'r'), open(args.node_fn_in, 'r'), open(args.fn_out, 'w'), verbose=args.verbose) diff --git a/experiments/timfuz/timfuz.py b/experiments/timfuz/timfuz.py new file mode 100644 index 00000000..1e14074b --- /dev/null +++ b/experiments/timfuz/timfuz.py @@ -0,0 +1,819 @@ +#!/usr/bin/env python + +# https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html +from scipy.optimize import linprog +import math +import numpy as np +from collections import OrderedDict +import time +import re +import os +import datetime +import json +import copy +import sys +import random +import glob + +from benchmark import Benchmark + +NAME_ZERO = set([ + "BSW_CLK_ZERO", + "BSW_ZERO", + "B_ZERO", + "C_CLK_ZERO", + "C_DSP_ZERO", + "C_ZERO", + "I_ZERO", + "O_ZERO", + "RC_ZERO", + "R_ZERO", + ]) + +# csv index +corner_s2i = { + 'fast_max': 0, + 'fast_min': 1, + 'slow_max': 2, + 'slow_min': 3, + } + +def print_eqns(A_ubd, b_ub, verbose=0, lim=3, label=''): + rows = len(b_ub) + + print('Sample equations (%s) from %d r' % (label, rows)) + prints = 0 + #verbose = 1 + for rowi, row in enumerate(A_ubd): + if verbose or ((rowi < 10 or rowi % max(1, (rows / 20)) == 0) and (not lim or prints < lim)): + line = ' EQN: p%u: ' % rowi + for k, v in sorted(row.items()): + line += '%u*t%d ' % (v, k) + line += '= %d' % b_ub[rowi] + print(line) + prints += 1 + +def print_name_eqns(A_ubd, b_ub, names, verbose=0, lim=3, label=''): + rows = len(b_ub) + + print('Sample equations (%s) from %d r' % (label, rows)) + prints = 0 + #verbose = 1 + for rowi, row in enumerate(A_ubd): + if verbose or ((rowi < 10 or rowi % max(1, (rows / 20)) == 0) and (not lim or prints < lim)): + line = ' EQN: p%u: ' % rowi + for k, v in sorted(row.items()): + line += '%u*%s ' % (v, names[k]) + line += '= %d' % b_ub[rowi] + print(line) + prints += 1 + +def print_names(names, verbose=1): + print('Names: %d' % len(names)) + for xi, name in enumerate(names): + print(' % 4u % -80s' % (xi, name)) + +def invb(b_ub): + #return [-b for b in b_ub] + return -np.array(b_ub) + +def check_feasible_d(A_ubd, b_ub, names): + A_ub, b_ub_inv = Ab_d2np(A_ubd, b_ub, names) + check_feasible(A_ub, b_ub_inv) + +def check_feasible(A_ub, b_ub): + sys.stdout.write('Check feasible ') + sys.stdout.flush() + + rows = len(b_ub) + cols = len(A_ub[0]) + + progress = max(1, rows / 100) + + # Chose a high arbitrary value for x + # Delays should be in order of ns, so a 10 ns delay should be way above what anything should be + xs = [10e3 for _i in range(cols)] + + # FIXME: use the correct np function to do this for 
me + # Verify bounds + #b_res = np.matmul(A_ub, xs) + #print(type(A_ub), type(xs) + #A_ub = np.array(A_ub) + #xs = np.array(xs) + #b_res = np.matmul(A_ub, xs) + def my_mul(A_ub, xs): + #print('cols', cols + #print('rows', rows + ret = [None] * rows + for row in range(rows): + this = 0 + for col in range(cols): + this += A_ub[row][col] * xs[col] + ret[row] = this + return ret + b_res = my_mul(A_ub, xs) + + # Verify bound was respected + for rowi, (this_b, this_b_ub) in enumerate(zip(b_res, b_ub)): + if rowi % progress == 0: + sys.stdout.write('.') + sys.stdout.flush() + if this_b >= this_b_ub or this_b > 0: + print('% 4d Want res % 10.1f <= % 10.1f <= 0' % (rowi, this_b, this_b_ub)) + raise Exception("Bad ") + print(' done') + +def Ab_ub_dt2d(eqns): + '''Convert dict using the rows as keys into a list of dicts + b_ub list (ie return A_ub, b_ub)''' + #return [dict(rowt) for rowt in eqns] + rows = [(dict(rowt), b) for rowt, b in eqns.items()] + A_ubd, b_ub = zip(*rows) + return list(A_ubd), list(b_ub) + +# This significantly reduces runtime +def simplify_rows(A_ubd, b_ub): + '''Remove duplicate equations, taking highest delay''' + # dict of constants to highest delay + eqns = OrderedDict() + assert len(A_ubd) == len(b_ub), (len(A_ubd), len(b_ub)) + + sys.stdout.write('SimpR ') + sys.stdout.flush() + progress = max(1, len(b_ub) / 100) + zero_ds = 0 + zero_es = 0 + for loopi, (b, rowd) in enumerate(zip(b_ub, A_ubd)): + if loopi % progress == 0: + sys.stdout.write('.') + sys.stdout.flush() + + # TODO: elements have zero delay (ex: COUT) + # Remove these from now since they make me nervous + # Although they should just solve to 0 + if not b: + zero_ds += 1 + continue + + # A very few of these exist with very small values + # TODO: investigate, understand what these are + # Leaving these in can make the result unsolvable since there does not exist a set of constants to reach the delay + if len(rowd) == 0: + zero_es += 1 + continue + + rowt = Ar_ds2t(rowd) + eqns[rowt] = max(eqns.get(rowt, 0), b) + + print(' done') + + #A_ub_ret = eqns.keys() + A_ubd_ret, b_ub_ret = Ab_ub_dt2d(eqns) + + print('Simplify rows: %d => %d w/ zd %d, ze %d' % (len(b_ub), len(b_ub_ret), zero_ds, zero_es)) + #return A_ub_ret, b_ub_ret + #return A_ub_np2d(A_ub_ret), b_ub_ret + return A_ubd_ret, b_ub_ret + +def simplify_cols(names, A_ubd, b_ub): + ''' + Remove unsued columns + This is fairly straightforward in dictionary form now as only have to remove and adjust indices + Maybe should use the names as keys? Then this wouldn't be needed anymore as indices wouldn't need to be rebased + + XXX: shuffles the name order around. Do we care? 
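
The row-level counterpart above (simplify_rows) boils down to keying each row by its sorted (column, coefficient) tuple and keeping the largest observed delay. A minimal standalone sketch with invented data, not part of the patch:

    from collections import OrderedDict

    def dedup_rows(rows, bounds):
        '''Drop duplicate constraint rows, keeping the largest bound.'''
        eqns = OrderedDict()
        for rowd, b in zip(rows, bounds):
            key = tuple(sorted(rowd.items()))
            eqns[key] = max(eqns.get(key, 0), b)
        return [dict(k) for k in eqns.keys()], list(eqns.values())

    # dedup_rows([{0: 1}, {0: 1}], [5, 7]) -> ([{0: 1}], [7])
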
+ ''' + + # First: find unused names + # use dict since no standard ordered set + used_cols = set() + names_ret = OrderedDict() + col_old2new = OrderedDict() + rows = len(b_ub) + cols = len(names) + + sys.stdout.write('SimpC indexing ') + sys.stdout.flush() + progress = max(1, rows / 100) + for rowi, rowd in enumerate(A_ubd): + if rowi % progress == 0: + sys.stdout.write('.') + sys.stdout.flush() + for coli in rowd.keys(): + used_cols.add(coli) + + for coli in range(cols): + if coli in used_cols: + names_ret[names[coli]] = None + col_old2new[coli] = len(col_old2new) + assert len(used_cols) == len(col_old2new) + + print(' done') + + # Create a new matrix, copying important values over + #A_ub_ret = np.zeros((4, 1)) + #A_ub_ret[3][0] = 1.0 + #A_ub_ret = np.zeros((rows, len(names_ret))) + A_ub_ret = [None] * rows + sys.stdout.write('SimpC creating ') + sys.stdout.flush() + progress = max(1, rows / 100) + for rowi, rowd_old in enumerate(A_ubd): + if rowi % progress == 0: + sys.stdout.write('.') + sys.stdout.flush() + l = [(col_old2new[k], v) for k, v in rowd_old.items()] + A_ub_ret[rowi] = OrderedDict(l) + print(' done') + + print('Simplify cols: %d => %d cols' % (len(names), len(names_ret))) + nr = list(names_ret.keys()) + return nr, A_ub_ret, b_ub + +def A_ubr_np2d(row, sf=1): + '''Convert a single row''' + #d = {} + d = OrderedDict() + for coli, val in enumerate(row): + if val: + d[coli] = sf * val + return d + +def A_ub_np2d(A_ub, sf=1): + '''Convert A_ub entries in numpy matrix to dictionary / sparse form''' + A_ubd = [None] * len(A_ub) + for i, row in enumerate(A_ub): + A_ubd[i] = A_ubr_np2d(row, sf=sf) + return A_ubd + +# def Ar_ds2np(row_ds, names): +# Ar_di2np(row_di, cols, sf=1) + +def Ar_di2np(row_di, cols, sf=1): + rownp = np.zeros(cols) + for coli, val in row_di.items(): + # Sign inversion due to way solver works + rownp[coli] = sf * val + return rownp + +# NOTE: sign inversion +def A_di2np(Adi, cols, sf=1): + '''Convert A_ub entries in dictionary / sparse to numpy matrix form''' + return [Ar_di2np(row_di, cols, sf=sf) for row_di in Adi] + +def Ar_ds2t(rowd): + '''Convert a dictionary row into a tuple with (column number, value) tuples''' + return tuple(sorted(rowd.items())) + +def A_ubr_t2d(rowt): + '''Convert a dictionary row into a tuple with (column number, value) tuples''' + return OrderedDict(rowt) + +def A_ub_d2t(A_ubd): + '''Convert rows as dicts to rows as tuples''' + return [Ar_ds2t(rowd) for rowd in A_ubd] + +def A_ub_t2d(A_ubd): + '''Convert rows as tuples to rows as dicts''' + return [OrderedDict(rowt) for rowt in A_ubd] + +def Ab_d2np(A_ubd, b_ub, names): + A_ub = A_di2np(A_ubd, len(names)) + b_ub_inv = invb(b_ub) + return A_ub, b_ub_inv + +def Ab_np2d(A_ub, b_ub_inv): + A_ubd = A_ub_np2d(A_ub) + b_ub = invb(b_ub_inv) + return A_ubd, b_ub + +def sort_equations_(A_ubd, b_ub): + # Dictionaries aren't hashable for sorting even though they are comparable + return A_ub_t2d(sorted(A_ub_d2t(A_ubd))) + +def sort_equations(A_ub, b_ub): + # Track rows with value column + # Hmm can't sort against np arrays + tosort = [(sorted(row.items()), b) for row, b in zip(A_ub, b_ub)] + #res = sorted(tosort, key=lambda e: e[0]) + res = sorted(tosort) + A_ubtr, b_ubr = zip(*res) + return [OrderedDict(rowt) for rowt in A_ubtr], b_ubr + +def lte_const(row_ref, row_cmp): + '''Return true if all constants are smaller magnitude in row_cmp than row_ref''' + #return False + for k, vc in row_cmp.items(): + vr = row_ref.get(k, None) + # Not in reference? 
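
Behavior of lte_const in miniature, with invented rows (a standalone usage note, not part of the function body): row_cmp can be subtracted from row_ref only when each of its coefficients is present in row_ref and no larger.

    assert lte_const({'t0': 2, 't1': 1}, {'t0': 1})      # subtractable
    assert not lte_const({'t0': 1}, {'t0': 2})           # would go negative
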
+ if vr is None: + return False + if vr < vc: + return False + return True + +def shared_const(row_ref, row_cmp): + '''Return true if more constants are equal than not equal''' + #return False + matches = 0 + unmatches = 0 + ks = list(row_ref.keys()) + list(row_cmp.keys()) + for k in ks: + vr = row_ref.get(k, None) + vc = row_cmp.get(k, None) + # At least one + if vr is not None and vc is not None: + if vc == vr: + matches += 1 + else: + unmatches += 1 + else: + unmatches += 1 + + # Will equation reduce if subtracted? + return matches > unmatches + +def reduce_const(row_ref, row_cmp): + '''Subtract cmp constants from ref''' + #ret = {} + ret = OrderedDict() + ks = set(row_ref.keys()) + ks.update(set(row_cmp.keys())) + for k in ks: + vr = row_ref.get(k, 0) + vc = row_cmp.get(k, 0) + res = vr - vc + if res: + ret[k] = res + return ret + +def derive_eq_by_row(A_ubd, b_ub, verbose=0, col_lim=0, tweak=False): + ''' + Derive equations by subtracting whole rows + + Given equations like: + t0 >= 10 + t0 + t1 >= 15 + t0 + t1 + t2 >= 17 + + When I look at these, I think of a solution something like: + t0 = 10f + t1 = 5 + t2 = 2 + + However, linprog tends to choose solutions like: + t0 = 17 + t1 = 0 + t2 = 0 + + To this end, add additional constraints by finding equations that are subsets of other equations + How to do this in a reasonable time span? + Also equations are sparse, which makes this harder to compute + ''' + rows = len(A_ubd) + assert rows == len(b_ub) + + # Index equations into hash maps so can lookup sparse elements quicker + assert len(A_ubd) == len(b_ub) + A_ubd_ret = copy.copy(A_ubd) + assert len(A_ubd) == len(A_ubd_ret) + + #print('Finding subsets') + ltes = 0 + scs = 0 + b_ub_ret = list(b_ub) + sys.stdout.write('Deriving rows ') + sys.stdout.flush() + progress = max(1, rows / 100) + for row_refi, row_ref in enumerate(A_ubd): + if row_refi % progress == 0: + sys.stdout.write('.') + sys.stdout.flush() + if col_lim and len(row_ref) > col_lim: + continue + + for row_cmpi, row_cmp in enumerate(A_ubd): + if row_refi == row_cmpi or col_lim and len(row_cmp) > col_lim: + continue + # FIXME: this check was supposed to be removed + ''' + Every elements in row_cmp is in row_ref + but this doesn't mean the constants are smaller + Filter these out + ''' + # XXX: just reduce and filter out solutions with positive constants + # or actually are these also useful as is? + lte = lte_const(row_ref, row_cmp) + if lte: + ltes += 1 + sc = 0 and shared_const(row_ref, row_cmp) + if sc: + scs += 1 + if lte or sc: + if verbose: + print('') + print('match') + print(' ', row_ref, b_ub[row_refi]) + print(' ', row_cmp, b_ub[row_cmpi]) + # Reduce + A_new = reduce_const(row_ref, row_cmp) + # Did this actually significantly reduce the search space? + #if tweak and len(A_new) > 4 and len(A_new) > len(row_cmp) / 2: + if tweak and len(A_new) > 8 and len(A_new) > len(row_cmp) / 2: + continue + b_new = b_ub[row_refi] - b_ub[row_cmpi] + # Definitely possible + # Maybe filter these out if they occur? 
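
The intent of this subtraction step, with invented numbers: from t0 + t1 >= 10 and t0 >= 4 it derives the extra constraint t1 >= 6, which stops the solver from dumping all delay into t0. A minimal standalone sketch of the reduction:

    def reduce_pair(row_ref, b_ref, row_cmp, b_cmp):
        '''Subtract one sparse constraint row from another.'''
        out = dict(row_ref)
        for k, v in row_cmp.items():
            out[k] = out.get(k, 0) - v
            if out[k] == 0:
                del out[k]
        return out, b_ref - b_cmp

    # reduce_pair({'t0': 1, 't1': 1}, 10, {'t0': 1}, 4) -> ({'t1': 1}, 6)
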
+ if verbose: + print(b_new) + # Also inverted sign + if b_new <= 0: + if verbose: + print("Unexpected b") + continue + if verbose: + print('OK') + A_ubd_ret.append(A_new) + b_ub_ret.append(b_new) + print(' done') + + #A_ub_ret = A_di2np(A_ubd2, cols=cols) + print('Derive row: %d => %d rows using %d lte, %d sc' % (len(b_ub), len(b_ub_ret), ltes, scs)) + assert len(A_ubd_ret) == len(b_ub_ret) + return A_ubd_ret, b_ub_ret + +def derive_eq_by_col(A_ubd, b_ub, verbose=0): + ''' + Derive equations by subtracting out all bounded constants (ie "known" columns) + ''' + rows = len(A_ubd) + + # Find all entries where + + # Index equations with a single constraint + knowns = {} + sys.stdout.write('Derive col indexing ') + #A_ubd = A_ub_np2d(A_ub) + sys.stdout.flush() + progress = max(1, rows / 100) + for row_refi, row_refd in enumerate(A_ubd): + if row_refi % progress == 0: + sys.stdout.write('.') + sys.stdout.flush() + if len(row_refd) == 1: + k, v = list(row_refd.items())[0] + # Reduce any constants to canonical form + if v != 1: + row_refd[k] = 1 + b_ub[row_refi] /= v + knowns[k] = b_ub[row_refi] + print(' done') + #knowns_set = set(knowns.keys()) + print('%d constrained' % len(knowns)) + + ''' + Now see what we can do + Rows that are already constrained: eliminate + TODO: maybe keep these if this would violate their constraint + Otherwise eliminate the original row and generate a simplified result now + ''' + b_ub_ret = [] + A_ubd_ret = [] + sys.stdout.write('Derive col main ') + sys.stdout.flush() + progress = max(1, rows / 100) + for row_refi, row_refd in enumerate(A_ubd): + if row_refi % progress == 0: + sys.stdout.write('.') + sys.stdout.flush() + # Reduce as much as possible + #row_new = {} + row_new = OrderedDict() + b_new = b_ub[row_refi] + # Copy over single entries + if len(row_refd) == 1: + row_new = row_refd + else: + for k, v in row_refd.items(): + if k in knowns: + # Remove column and take out corresponding delay + b_new -= v * knowns[k] + # Copy over + else: + row_new[k] = v + + # Possibly reduced all usable contants out + if len(row_new) == 0: + continue + if b_new <= 0: + continue + + A_ubd_ret.append(row_new) + b_ub_ret.append(b_new) + print(' done') + + print('Derive col: %d => %d rows' % (len(b_ub), len(b_ub_ret))) + return A_ubd_ret, b_ub_ret + +def col_dist(A_ubd, desc='of', names=[], lim=0): + '''print(frequency distribution of number of elements in a given row''' + rows = len(A_ubd) + cols = len(names) + + fs = {} + for row in A_ubd: + this_cols = len(row) + fs[this_cols] = fs.get(this_cols, 0) + 1 + + print('Col count distribution (%s) for %dr x %dc w/ %d freqs' % (desc, rows, cols, len(fs))) + prints = 0 + for i, (k, v) in enumerate(sorted(fs.items())): + if lim == 0 or (lim and prints < lim or i == len(fs) - 1): + print(' %d: %d' % (k, v)) + prints += 1 + if lim and prints == lim: + print(' ...') + +def name_dist(A_ubd, desc='of', names=[], lim=0): + '''print(frequency distribution of number of times an element appears''' + rows = len(A_ubd) + cols = len(names) + + fs = {i: 0 for i in range(len(names))} + for row in A_ubd: + for k in row.keys(): + fs[k] += 1 + + print('Name count distribution (%s) for %dr x %dc' % (desc, rows, cols)) + prints = 0 + for namei, name in enumerate(names): + if lim == 0 or (lim and prints < lim or namei == len(fs) - 1): + print(' %s: %d' % (name, fs[namei])) + prints += 1 + if lim and prints == lim: + print(' ...') + + fs2 = {} + for v in fs.values(): + fs2[v] = fs2.get(v, 0) + 1 + prints = 0 + print('Distribution distribution (%d items)'% 
len(fs2)) + for i, (k, v) in enumerate(sorted(fs2.items())): + if lim == 0 or (lim and prints < lim or i == len(fs2) - 1): + print(' %s: %s' % (k, v)) + prints += 1 + if lim and prints == lim: + print(' ...') + + zeros = fs2.get(0, 0) + if zeros: + raise Exception("%d names without equation" % zeros) + +def filter_ncols(A_ubd, b_ub, cols_min=0, cols_max=0): + '''Only keep equations with a few delay elements''' + A_ubd_ret = [] + b_ub_ret = [] + + #print('Removing large rows') + for rowd, b in zip(A_ubd, b_ub): + if (not cols_min or len(rowd) >= cols_min) and (not cols_max or len(rowd) <= cols_max): + A_ubd_ret.append(rowd) + b_ub_ret.append(b) + + print('Filter ncols w/ %d <= cols <= %d: %d ==> %d rows' % (cols_min, cols_max, len(b_ub), len(b_ub_ret))) + assert len(b_ub_ret) + return A_ubd_ret, b_ub_ret + +def preprocess(A_ubd, b_ub, opts, names, verbose=0): + def debug(what): + if verbose: + print('') + print_eqns(A_ubd, b_ub, verbose=verbose, label=what, lim=20) + col_dist(A_ubd, what, names) + check_feasible_d(A_ubd, b_ub, names) + + col_dist(A_ubd, 'pre-filt', names, lim=12) + debug('pre-filt') + + need_simpc = 0 + + # Input set may have redundant constraints + A_ubd, b_ub = simplify_rows(A_ubd=A_ubd, b_ub=b_ub) + debug("simp_rows") + cols_min_pre = opts.get('cols_min_pre', None) + cols_max_pre = opts.get('cols_max_pre', None) + # Filter input based on number of columns + if cols_min_pre or cols_max_pre: + A_ubd, b_ub = filter_ncols(A_ubd=A_ubd, b_ub=b_ub, cols_min=cols_min_pre, cols_max=cols_max_pre) + debug("filt_ncols") + need_simpc = 1 + + # Limit input rows, mostly for quick full run checks + row_limit = opts.get('row_limit', None) + if row_limit: + before_rows = len(b_ub) + A_ubd = A_ubd[0:row_limit] + b_ub = b_ub[0:row_limit] + print('Row limit %d => %d rows' % (before_rows, len(b_ub))) + need_simpc = 1 + + if need_simpc: + names, A_ubd, b_ub = simplify_cols(names=names, A_ubd=A_ubd, b_ub=b_ub) + debug("simp_cols") + + return A_ubd, b_ub, names + +def massage_equations(A_ubd, b_ub, opts, names, verbose=0): + ''' + Equation pipeline + Some operations may generate new equations + Simplify after these to avoid unnecessary overhead on redundant constraints + Similarly some operations may eliminate equations, potentially eliminating a column (ie variable) + Remove these columns as necessary to speed up solving + ''' + + def debug(what): + if verbose: + print('') + print_eqns(A_ubd, b_ub, verbose=verbose, label=what, lim=20) + col_dist(A_ubd, what, names) + check_feasible_d(A_ubd, b_ub, names) + + A_ubd, b_ub, names = preprocess(A_ubd, b_ub, opts, names, verbose=verbose) + + # Try to (intelligently) subtract equations to generate additional constraints + # This helps avoid putting all delay in a single shared variable + derive_lim = opts.get('derive_lim', None) + if derive_lim: + dstart = len(b_ub) + + # Original simple + if 0: + for di in range(derive_lim): + print + assert len(A_ubd) == len(b_ub) + n_orig = len(b_ub) + + # Meat of the operation + # Focus on easy equations for first pass to get a lot of easy derrivations + col_lim = 12 if di == 0 else None + #col_lim = None + A_ubd, b_ub = derive_eq_by_row(A_ubd, b_ub, col_lim=col_lim) + debug("der_rows") + # Run another simplify pass since new equations may have overlap with original + A_ubd, b_ub = simplify_rows(A_ubd, b_ub) + print('Derive row %d / %d: %d => %d equations' % (di + 1, derive_lim, n_orig, len(b_ub))) + debug("der_rows simp") + + n_orig2 = len(b_ub) + # Meat of the operation + A_ubd, b_ub = derive_eq_by_col(A_ubd, 
b_ub) + debug("der_cols") + # Run another simplify pass since new equations may have overlap with original + A_ubd, b_ub = simplify_rows(A_ubd=A_ubd, b_ub=b_ub) + print('Derive col %d / %d: %d => %d equations' % (di + 1, derive_lim, n_orig2, len(b_ub))) + debug("der_cols simp") + + if n_orig == len(b_ub): + break + + if 1: + # Each iteration one more column is allowed until all columns are included + # (and the system is stable) + col_lim = 15 + di = 0 + while True: + print + n_orig = len(b_ub) + + print('Loop %d, lim %d' % (di + 1, col_lim)) + # Meat of the operation + A_ubd, b_ub = derive_eq_by_row(A_ubd, b_ub, col_lim=col_lim, tweak=True) + debug("der_rows") + # Run another simplify pass since new equations may have overlap with original + A_ubd, b_ub = simplify_rows(A_ubd, b_ub) + print('Derive row: %d => %d equations' % (n_orig, len(b_ub))) + debug("der_rows simp") + + n_orig2 = len(b_ub) + # Meat of the operation + A_ubd, b_ub = derive_eq_by_col(A_ubd, b_ub) + debug("der_cols") + # Run another simplify pass since new equations may have overlap with original + A_ubd, b_ub = simplify_rows(A_ubd=A_ubd, b_ub=b_ub) + print('Derive col %d: %d => %d equations' % (di + 1, n_orig2, len(b_ub))) + debug("der_cols simp") + + # Doesn't help computation, but helps debugging + names, A_ubd, b_ub = simplify_cols(names=names, A_ubd=A_ubd, b_ub=b_ub) + A_ubd, b_ub = sort_equations(A_ubd, b_ub) + debug("loop done") + col_dist(A_ubd, 'derive done iter %d, lim %d' % (di, col_lim), names, lim=12) + + rows = len(A_ubd) + if n_orig == len(b_ub) and col_lim >= rows: + break + col_lim += col_lim / 5 + di += 1 + + dend = len(b_ub) + print('') + print('Derive net: %d => %d' % (dstart, dend)) + print('') + # Was experimentting to see how much the higher order columns really help + + cols_min_post = opts.get('cols_min_post', None) + cols_max_post = opts.get('cols_max_post', None) + # Filter input based on number of columns + if cols_min_post or cols_max_post: + A_ubd, b_ub = filter_ncols(A_ubd=A_ubd, b_ub=b_ub, cols_min=cols_min_post, cols_max=cols_max_post) + debug("filter_ncals final") + + names, A_ubd, b_ub = simplify_cols(names=names, A_ubd=A_ubd, b_ub=b_ub) + debug("simp_cols final") + + # Helps debug readability + A_ubd, b_ub = sort_equations(A_ubd, b_ub) + debug("final (sorted)") + return names, A_ubd, b_ub + +def Ar_di2ds(rowA, names): + row = OrderedDict() + for k, v in rowA.items(): + row[names[k]] = v + return row + +def A_di2ds(Adi, names): + rows = [] + for row_di in Adi: + rows.append(Ar_di2ds(row_di, names)) + return rows + +def Ar_ds2di(row_ds, names): + def keyi(name): + if name not in names: + names[name] = len(names) + return names[name] + + row_di = OrderedDict() + for k, v in row_ds.items(): + row_di[keyi(k)] = v + return row_di + +def A_ds2di(rows): + names = OrderedDict() + + A_ubd = [] + for row_ds in rows: + A_ubd.append(Ar_ds2di(row_ds, names)) + + return list(names.keys()), A_ubd + +def A_ds2np(Ads): + names, Adi = A_ds2di(Ads) + return names, A_di2np(Adi, len(names)) + +def loadc_Ads_mkb(fns, mkb, filt): + bs = [] + Ads = [] + for fn in fns: + with open(fn, 'r') as f: + # skip header + f.readline() + for l in f: + cols = l.split(',') + ico = bool(int(cols[0])) + corners = cols[1] + vars = cols[2:] + + corners = [int(x) for x in corners.split()] + def mkvar(x): + i, var = x.split() + return (var, int(i)) + vars = OrderedDict([mkvar(var) for var in vars]) + if not filt(ico, corners, vars): + continue + + bs.append(mkb(corners)) + Ads.append(vars) + + return Ads, bs + +def 
loadc_Ads_b(fns, corner, ico=None): + corner = corner or "slow_max" + corneri = corner_s2i[corner] + + if ico is not None: + filt = lambda ico, corners, vars: ico == ico + else: + filt = lambda ico, corners, vars: True + + def mkb(val): + return val[corneri] + return loadc_Ads_mkb(fns, mkb, filt) + +def index_names(Ads): + names = set() + for row_ds in Ads: + for k1 in row_ds.keys(): + names.add(k1) + return names diff --git a/experiments/timfuz/timfuz_checksub.py b/experiments/timfuz/timfuz_checksub.py new file mode 100644 index 00000000..774ce020 --- /dev/null +++ b/experiments/timfuz/timfuz_checksub.py @@ -0,0 +1,259 @@ +#!/usr/bin/env python3 + +from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np +import numpy as np +import glob +import json +import math +from collections import OrderedDict + +# check for issues that may be due to round off error +STRICT = 1 + +def Adi2matrix_random(A_ubd, b_ub, names): + # random assignment + # was making some empty rows + + A_ret = [np.zeros(len(names)) for _i in range(len(names))] + b_ret = np.zeros(len(names)) + + for row, b in zip(A_ubd, b_ub): + # Randomly assign to a row + dst_rowi = random.randint(0, len(names) - 1) + rownp = Ar_di2np(row, cols=len(names), sf=1) + + A_ret[dst_rowi] = np.add(A_ret[dst_rowi], rownp) + b_ret[dst_rowi] += b + return A_ret, b_ret + +def Ads2matrix_linear(Ads, b): + names, Adi = A_ds2di(Ads) + cols = len(names) + rows_out = len(b) + + A_ret = [np.zeros(cols) for _i in range(rows_out)] + b_ret = np.zeros(rows_out) + + dst_rowi = 0 + for row_di, row_b in zip(Adi, b): + row_np = Ar_di2np(row_di, cols) + + A_ret[dst_rowi] = np.add(A_ret[dst_rowi], row_np) + b_ret[dst_rowi] += row_b + dst_rowi = (dst_rowi + 1) % rows_out + return A_ret, b_ret + +def row_sub_syms(row, sub_json, verbose=False): + if 0 and verbose: + print("") + print(row.items()) + + delsyms = 0 + for k in sub_json['drop_names']: + try: + del row[k] + delsyms += 1 + except KeyError: + pass + if verbose: + print("Deleted %u symbols" % delsyms) + + if verbose: + print('Checking pivots') + print(sorted(row.items())) + for group, pivot in sorted(sub_json['pivots'].items()): + if pivot not in row: + continue + n = row[pivot] + print(' pivot %u %s' % (n, pivot)) + + for group, pivot in sorted(sub_json['pivots'].items()): + if pivot not in row: + continue + + # take the sub out n times + # note constants may be negative + n = row[pivot] + if verbose: + print('pivot %i %s' % (n, pivot)) + for subk, subv in sorted(sub_json['subs'][group].items()): + oldn = row.get(subk, 0) + rown = oldn - n * subv + if verbose: + print(" %s: %d => %d" % (subk, oldn, rown)) + if rown == 0: + # only becomes zero if didn't previously exist + del row[subk] + if verbose: + print(" del") + else: + row[subk] = rown + row[group] = n + assert pivot not in row + + # after all constants are applied, the row should end up positive? 
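
A reduced illustration of folding a solved variable into a sparse row (names and numbers invented); the group substitution above follows the same pattern, with coefficient dictionaries in place of scalar delays:

    def sub_known(row, b, known):
        '''Fold solved variables (name -> delay) out of a constraint row.'''
        out = dict(row)
        for k, v in known.items():
            if k in out:
                b -= out.pop(k) * v
        return out, b

    # sub_known({'t1': 1, 't2': 2}, 11, {'t2': 3}) -> ({'t1': 1}, 5)
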
+ if STRICT: + for k, v in sorted(row.items()): + assert v > 0, (k, v) + +def run_sub_json(Ads, sub_json, verbose=False): + nrows = 0 + nsubs = 0 + + ncols_old = 0 + ncols_new = 0 + + print('Subbing %u rows' % len(Ads)) + prints = set() + + for rowi, row in enumerate(Ads): + if 0 and verbose: + print(row) + if verbose: + print('') + print('Row %u w/ %u elements' % (rowi, len(row))) + + row_orig = dict(row) + row_sub_syms(row, sub_json, verbose=verbose) + nrows += 1 + if row_orig != row: + nsubs += 1 + if verbose: + rowt = Ar_ds2t(row) + if rowt not in prints: + print('row', row) + prints.add(rowt) + ncols_old += len(row_orig) + ncols_new += len(row) + + if verbose: + print('') + + print("Sub: %u / %u rows changed" % (nsubs, nrows)) + print("Sub: %u => %u cols" % (ncols_old, ncols_new)) + +def pmatrix(Anp, s): + import sympy + msym = sympy.Matrix(Anp) + print(s) + sympy.pprint(msym) + +def pds(Ads, s): + names, Anp = A_ds2np(Ads) + pmatrix(Anp, s) + print('Names: %s' % (names,)) + +def run(fns_in, sub_json=None, verbose=False, corner=None): + Ads, b = loadc_Ads_b(fns_in, corner, ico=True) + + # Remove duplicate rows + # is this necessary? + # maybe better to just add them into the matrix directly + #Ads, b = simplify_rows(Ads, b) + + if sub_json: + print('Subbing JSON %u rows' % len(Ads)) + #pds(Ads, 'Orig') + names_old = index_names(Ads) + run_sub_json(Ads, sub_json, verbose=verbose) + names_new = index_names(Ads) + print("Sub: %u => %u names" % (len(names_old), len(names_new))) + print(names_new) + print('Subbed JSON %u rows' % len(Ads)) + names = names_new + #pds(Ads, 'Sub') + else: + names = index_names(Ads) + + # Squash into a matrix + # A_ub2, b_ub2 = Adi2matrix_random(A_ubd, b, names) + Amat, _bmat = Ads2matrix_linear(Ads, b) + #pmatrix(Amat, 'Matrix') + + ''' + The matrix must be fully ranked to even be considered reasonable + Even then, floating point error *possibly* could make it fully ranked, although probably not since we have whole numbers + Hence the slogdet check + ''' + print + # https://docs.scipy.org/doc/numpy-dev/reference/generated/numpy.linalg.matrix_rank.html + print('rank: %s / %d col' % (np.linalg.matrix_rank(Amat), len(names))) + if 0: + # https://docs.scipy.org/doc/numpy-1.14.0/reference/generated/numpy.linalg.slogdet.html + sign, logdet = np.linalg.slogdet(Amat) + # If the determinant is zero, then sign will be 0 and logdet will be -Inf + if sign == 0 and logdet == float('-inf'): + print('slogdet :( : 0') + else: + print('slogdet :) : %s, %s' % (sign, logdet)) + +def load_sub(fn): + delta = 0.001 + j = json.load(open(fn, 'r')) + + # convert groups to use integer constants + # beware of roundoff error + # if we round poorly here, it won't give incorrect results later, but may make it fail to find a good solution + + if 'pivots' in j: + print('pivots: using existing') + else: + print('pivots: guessing') + + pivots = OrderedDict() + j['pivots'] = pivots + + for name, vals in sorted(j['subs'].items()): + pivot = None + for k, v in vals.items(): + if STRICT: + vi = int(round(v)) + assert abs(vi - v) < delta + vals[k] = vi + else: + vals[k] = float(v) + + # there may be more than one acceptable pivot + # take the first + if v == 1 and pivot is None: + pivot = k + assert pivot is not None + pivots[name] = pivot + + return j + +def main(): + import argparse + + parser = argparse.ArgumentParser( + description= + 'Check sub.json solution feasibility' + ) + + parser.add_argument('--verbose', action='store_true', help='') + parser.add_argument('--sub-json', help='') + 
parser.add_argument('--corner', default="slow_max", help='') + parser.add_argument( + 'fns_in', + nargs='*', + help='timing3.txt input files') + args = parser.parse_args() + # Store options in dict to ease passing through functions + bench = Benchmark() + + fns_in = args.fns_in + if not fns_in: + fns_in = glob.glob('specimen_*/timing3.txt') + + sub_json = None + if args.sub_json: + sub_json = load_sub(args.sub_json) + + try: + run(sub_json=sub_json, + fns_in=fns_in, verbose=args.verbose, corner=args.corner) + finally: + print('Exiting after %s' % bench) + +if __name__ == '__main__': + main() diff --git a/experiments/timfuz/timfuz_corner_csv.py b/experiments/timfuz/timfuz_corner_csv.py new file mode 100644 index 00000000..1df10bd0 --- /dev/null +++ b/experiments/timfuz/timfuz_corner_csv.py @@ -0,0 +1,60 @@ +#!/usr/bin/env python3 + +from timfuz import Benchmark, simplify_rows, loadc_Ads_b +import glob + +def run(fout, fns_in, corner, verbose=0): + Ads, b = loadc_Ads_b(fns_in, corner, ico=True) + Ads, b = simplify_rows(Ads, b) + + fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') + for row_b, row_ds in zip(b, Ads): + # write in same format, but just stick to this corner + out_b = [str(row_b) for _i in range(4)] + ico = '1' + items = [ico, ' '.join(out_b)] + + for k, v in sorted(row_ds.items()): + items.append('%u %s' % (v, k)) + fout.write(','.join(items) + '\n') + +def main(): + import argparse + + parser = argparse.ArgumentParser( + description= + 'Create a .csv with a single process corner' + ) + + parser.add_argument('--verbose', type=int, help='') + parser.add_argument('--auto-name', action='store_true', help='timing3.csv => timing3c.csv') + parser.add_argument('--out', default=None, help='Output csv') + parser.add_argument('--corner', help='Output csv') + parser.add_argument( + 'fns_in', + nargs='*', + help='timing3.csv input files') + args = parser.parse_args() + bench = Benchmark() + + fnout = args.out + if fnout is None: + if args.auto_name: + assert len(args.fns_in) == 1 + fnin = args.fns_in[0] + fnout = fnin.replace('timing3.csv', 'timing3c.csv') + assert fnout != fnin, 'Expect timing3.csv in' + else: + fnout = '/dev/stdout' + print("Writing to %s" % fnout) + fout = open(fnout, 'w') + + fns_in = args.fns_in + if not fns_in: + fns_in = glob.glob('specimen_*/timing3.csv') + + run(fout=fout, + fns_in=fns_in, corner=args.corner, verbose=args.verbose) + +if __name__ == '__main__': + main() diff --git a/experiments/timfuz/timfuz_csv.py b/experiments/timfuz/timfuz_csv.py new file mode 100644 index 00000000..97da40e1 --- /dev/null +++ b/experiments/timfuz/timfuz_csv.py @@ -0,0 +1,272 @@ +#!/usr/bin/env python3 + +from timfuz import Benchmark, row_di2ds, A_di2ds +import numpy as np +import glob +import math +import json +import sympy +import sys +from collections import OrderedDict + +# Speed index: some sort of special value +SI_NONE = 0xFFFF + +PREFIX_W = 'WIRE_' +PREFIX_P = 'PIP_' +#PREFIX_W = '' +#PREFIX_P = '' + +def parse_pip(s): + # Entries like + # CLK_BUFG_REBUF_X60Y117/CLK_BUFG_REBUF.CLK_BUFG_REBUF_R_CK_GCLK0_BOT<<->>CLK_BUFG_REBUF_R_CK_GCLK0_TOP + # Convert to (site, type, pip_junction, pip) + pipstr, speed_index = s.split(':') + speed_index = int(speed_index) + site, instance = pipstr.split('/') + #type, pip_junction, pip = others.split('.') + #return (site, type, pip_junction, pip) + return site, instance, int(speed_index) + +def parse_node(s): + node, nwires = s.split(':') + return node, int(nwires) + +def parse_wire(s): + # CLBLM_R_X3Y80/CLBLM_M_D6:952 + 
wirestr, speed_index = s.split(':') + site, instance = wirestr.split('/') + return site, instance, int(speed_index) + +# FIXME: these actually have a delay element +# Probably need to put these back in +def remove_virtual_pips(pips): + return pips + return filter(lambda pip: not re.match(r'CLBL[LM]_[LR]_', pip[0]), pips) + +def load_timing3(f, name='file'): + # src_bel dst_bel ico fast_max fast_min slow_max slow_min pips + f.readline() + ret = [] + bads = 0 + for l in f: + # FIXME: hack + if 0 and 'CLK' in l: + continue + + l = l.strip() + if not l: + continue + parts = l.split(' ') + # FIXME: deal with these nodes + if len(parts) != 11: + bads += 1 + continue + net, src_bel, dst_bel, ico, fast_max, fast_min, slow_max, slow_min, pips, nodes, wires = parts + pips = pips.split('|') + nodes = nodes.split('|') + wires = wires.split('|') + ret.append({ + 'net': net, + 'src_bel': src_bel, + 'dst_bel': dst_bel, + 'ico': int(ico), + # ps + 'fast_max': int(fast_max), + 'fast_min': int(fast_min), + 'slow_max': int(slow_max), + 'slow_min': int(slow_min), + 'pips': remove_virtual_pips([parse_pip(pip) for pip in pips]), + 'nodes': [parse_node(node) for node in nodes], + 'wires': [parse_wire(wire) for wire in wires], + 'line': l, + }) + print(' load %s: %d bad, %d good' % (name, bads, len(ret))) + #assert 0 + return ret + +def load_speed_json(f): + j = json.load(f) + # Index speed indexes to names + speed_i2s = {} + for k, v in j['speed_model'].items(): + i = v['speed_index'] + if i != SI_NONE: + speed_i2s[i] = k + return j, speed_i2s + +# Verify the nodes and wires really do line up +def vals2Adi_check(vals, names): + print('Checking') + for val in vals: + node_wires = 0 + for _node, wiresn in val['nodes']: + node_wires += wiresn + assert node_wires == len(val['wires']) + print('Done') + assert 0 + +def vals2Adi(vals, speed_i2s, + name_tr={}, name_drop=[], + verbose=False): + def pip2speed(pip): + _site, _name, speed_index = pip + return PREFIX_P + speed_i2s[speed_index] + def wire2speed(wire): + _site, _name, speed_index = wire + return PREFIX_W + speed_i2s[speed_index] + + # Want this ordered + names = OrderedDict() + + print('Creating matrix w/ tr: %d, drop: %d' % (len(name_tr), len(name_drop))) + + # Take sites out entirely using handy "interconnect only" option + #vals = filter(lambda x: str(x).find('SLICE') >= 0, vals) + # Highest count while still getting valid result + + # First index all of the given pip types + # Start out as set then convert to list to keep matrix order consistent + sys.stdout.write('Indexing delay elements ') + sys.stdout.flush() + progress = max(1, len(vals) / 100) + for vali, val in enumerate(vals): + if vali % progress == 0: + sys.stdout.write('.') + sys.stdout.flush() + odl = [(pip2speed(pip), None) for pip in val['pips']] + names.update(OrderedDict(odl)) + + odl = [(wire2speed(wire), None) for wire in val['wires']] + names.update(OrderedDict(odl)) + print(' done') + + # Apply transform + orig_names = len(names) + for k in (list(name_drop) + list(name_tr.keys())): + if k in names: + del names[k] + else: + print('WARNING: failed to remove %s' % k) + names.update(OrderedDict([(name, None) for name in name_tr.values()])) + print('Names tr %d => %d' % (orig_names, len(names))) + + # Make unique list + names = list(names.keys()) + name_s2i = {} + for namei, name in enumerate(names): + name_s2i[name] = namei + if verbose: + for name in names: + print('NAME: ', name) + for name in name_drop: + print('DROP: ', name) + for l, r in name_tr.items(): + print('TR: %s => %s' % (l, 
r)) + + # Now create a matrix with all of these delays + # Each row needs len(names) elements + # -2 means 2 elements present, 0 means absent + # (could hit same pip twice) + print('Creating delay element matrix w/ %d names' % len(names)) + Adi = [None for _i in range(len(vals))] + for vali, val in enumerate(vals): + def add_name(name): + if name in name_drop: + return + name = name_tr.get(name, name) + namei = name_s2i[name] + row_di[namei] = row_di.get(namei, 0) + 1 + + # Start with 0 occurances + #row = [0 for _i in range(len(names))] + row_di = {} + + #print('pips: ', val['pips'] + for pip in val['pips']: + add_name(pip2speed(pip)) + for wire in val['wires']: + add_name(wire2speed(wire)) + #A_ub.append(row) + Adi[vali] = row_di + + return Adi, names + +# TODO: load directly as Ads +# remove names_tr, names_drop +def vals2Ads(vals, speed_i2s, verbose=False): + Adi, names = vals2Adi(vals, speed_i2s, verbose=False) + return A_di2ds(Adi, names) + +def load_Ads(speed_json_f, f_ins): + + print('Loading data') + + _speedj, speed_i2s = load_speed_json(speed_json_f) + + vals = [] + for avals in [load_timing3(f_in, name) for f_in, name in f_ins]: + vals.extend(avals) + + Ads = vals2Ads(vals, speed_i2s) + + def mkb(val): + return (val['fast_max'], val['fast_min'], val['slow_max'], val['slow_min']) + b = [mkb(val) for val in vals] + ico = [val['ico'] for val in vals] + + return Ads, b, ico + +def run(speed_json_f, fout, f_ins, verbose=0, corner=None): + Ads, bs, ico = load_Ads(speed_json_f, f_ins) + + fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') + for row_bs, row_ds, row_ico in zip(bs, Ads, ico): + # like: 123 456 120 450, 1 a, 2 b + # first column has delay corners, followed by delay element count + items = [str(row_ico), ' '.join([str(x) for x in row_bs])] + for k, v in sorted(row_ds.items()): + items.append('%u %s' % (v, k)) + fout.write(','.join(items) + '\n') + +def main(): + import argparse + + parser = argparse.ArgumentParser( + description= + 'Convert obscure timing3.txt into more readable but roughly equivilent timing3.csv' + ) + + parser.add_argument('--verbose', type=int, help='') + parser.add_argument('--auto-name', action='store_true', help='timing3.txt => timing3.csv') + parser.add_argument('--speed-json', default='build_speed/speed.json', + help='Provides speed index to name translation') + parser.add_argument('--out', default=None, help='Output csv') + parser.add_argument( + 'fns_in', + nargs='*', + help='timing3.txt input files') + args = parser.parse_args() + bench = Benchmark() + + fnout = args.out + if fnout is None: + if args.auto_name: + assert len(args.fns_in) == 1 + fnin = args.fns_in[0] + fnout = fnin.replace('.txt', '.csv') + assert fnout != fnin, 'Expect .txt in' + else: + fnout = '/dev/stdout' + print("Writing to %s" % fnout) + fout = open(fnout, 'w') + + fns_in = args.fns_in + if not fns_in: + fns_in = glob.glob('specimen_*/timing3.txt') + + run(speed_json_f=open(args.speed_json, 'r'), fout=fout, + f_ins=[(open(fn_in, 'r'), fn_in) for fn_in in fns_in], verbose=args.verbose) + +if __name__ == '__main__': + main() diff --git a/experiments/timfuz/timfuz_rref.py b/experiments/timfuz/timfuz_rref.py new file mode 100644 index 00000000..2fc3c103 --- /dev/null +++ b/experiments/timfuz/timfuz_rref.py @@ -0,0 +1,206 @@ +#!/usr/bin/env python3 + +''' +Triaging tool to help understand where we need more timing coverage +Finds correlated variables to help make better test cases +''' + +from timfuz import Benchmark, Ar_di2np, loadc_Ads_b, index_names, A_ds2np 
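
The heart of this tool is sympy's reduced row echelon form. A tiny invented system showing what rref() and its pivot list give back:

    import sympy

    # Rows: t0 + t1 always observed together, t2 observed alone.
    m = sympy.Matrix([
        [1, 1, 0],
        [0, 0, 1],
    ])
    rref, pivots = m.rref()
    # pivots == (0, 2): column 1 never appears independently, so t0 and t1
    # can only be recovered as the group t0 + t1.
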
+import numpy as np +import glob +import math +import json +import sympy +from collections import OrderedDict + +STRICT = 1 + +class State(object): + def __init__(self, Ads, drop_names=[]): + self.Ads = Ads + self.names = index_names(self.Ads) + + # known zero delay elements + self.drop_names = set(drop_names) + # active names in rows + # includes sub symbols, excludes symbols that have been substituted out + self.base_names = set(self.names) + self.names = set(self.base_names) + # List of variable substitutions + # k => dict of v:n entries that it came from + self.subs = {} + self.verbose = True + + def print_stats(self): + print("Stats") + print(" Substitutions: %u" % len(self.subs)) + if self.subs: + print(" Largest: %u" % max([len(x) for x in self.subs.values()])) + print(" Rows: %u" % len(self.Ads)) + print(" Cols (in): %u" % (len(self.base_names) + len(self.drop_names))) + print(" Cols (preprocessed): %u" % len(self.base_names)) + print(" Drop names: %u" % len(self.drop_names)) + print(" Cols (out): %u" % len(self.names)) + assert len(self.names) >= len(self.subs) + + @staticmethod + def load(fn_ins): + Ads, _b = loadc_Ads_b(fn_ins, corner=None, ico=True) + return State(Ads) + +def write_state(state, fout): + j = { + 'names': dict([(x, None) for x in state.names]), + 'drop_names': list(state.drop_names), + 'base_names': list(state.base_names), + 'subs': dict([(name, values) for name, values in state.subs.items()]), + 'pivots': state.pivots, + } + json.dump(j, fout, sort_keys=True, indent=4, separators=(',', ': ')) + +def Adi2matrix(Adi, cols): + A_ub2 = [np.zeros(cols) for _i in range(cols)] + + dst_rowi = 0 + for row in Adi: + rownp = Ar_di2np(row, cols=len(names), sf=1) + + A_ub2[dst_rowi] = np.add(A_ub2[dst_rowi], rownp) + dst_rowi = (dst_rowi + 1) % len(names) + + return A_ub2 + +def Anp2matrix(Anp): + ncols = len(Anp[0]) + A_ub2 = [np.zeros(ncols) for _i in range(ncols)] + dst_rowi = 0 + for rownp in Anp: + A_ub2[dst_rowi] = np.add(A_ub2[dst_rowi], rownp) + dst_rowi = (dst_rowi + 1) % ncols + return A_ub2 + +def row_np2ds(rownp, names): + ret = {} + assert len(rownp) == len(names), (len(rownp), len(names)) + for namei, name in enumerate(names): + v = rownp[namei] + if v: + ret[name] = v + return ret + +def comb_corr_sets(state, verbose=False): + print('Converting rows to integer keys') + names, Anp = A_ds2np(state.Ads) + + print('np: %u rows x %u cols' % (len(Anp), len(Anp[0]))) + print('Combining rows into matrix') + mnp = Anp2matrix(Anp) + print('Matrix: %u rows x %u cols' % (len(mnp), len(mnp[0]))) + print('Converting np to sympy matrix') + msym = sympy.Matrix(mnp) + print('Making rref') + rref, pivots = msym.rref() + + if verbose: + print('names') + print(names) + print('Matrix') + sympy.pprint(msym) + print('Pivots') + sympy.pprint(pivots) + print('rref') + sympy.pprint(rref) + + state.pivots = {} + + def row_solved(rownp, row_pivot): + for ci, c in enumerate(rownp): + if ci == row_pivot: + continue + if c != 0: + return False + return True + + rrefnp = np.array(rref).astype(np.float64) + print('Computing groups w/ rref %u row x %u col' % (len(rrefnp), len(rrefnp[0]))) + #print(rrefnp) + # rows that have a single 1 are okay + # anything else requires substitution (unless all 0) + # pivots may be fewer than the rows + # remaining rows should be 0s + for row_i, (row_pivot, rownp) in enumerate(zip(pivots, rrefnp)): + rowds = row_np2ds(rownp, names) + # boring cases: solved variable, not fully ranked + #if sum(rowds.values()) == 1: + if row_solved(rownp, row_pivot): + continue 
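
The grouping loop below ends up serialized (via write_state above) roughly like this; the names and coefficients are invented for illustration:

    sub_example = {
        'pivots': {'GROUP_7': 'PIP_BSW_LONG'},
        'subs': {'GROUP_7': {'PIP_BSW_LONG': 1, 'WIRE_CLBLM_M_D6': 2}},
        'drop_names': [],
    }
    # Reading: wherever PIP_BSW_LONG appears, checksub removes it plus twice
    # WIRE_CLBLM_M_D6 and reintroduces GROUP_7 in their place.
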
+ + # a grouping + group_name = "GROUP_%u" % row_i + if STRICT: + delta = 0.001 + rowds_store = {} + for k, v in rowds.items(): + vi = int(round(v)) + error = abs(vi - v) + assert error < delta, (error, delta) + rowds_store[k] = vi + else: + rowds_store = rowds + state.subs[group_name] = rowds_store + # Add the new symbol + state.names.add(group_name) + # Remove substituted symbols + # Note: symbols may appear multiple times + state.names.difference_update(set(rowds.keys())) + pivot_name = names[row_pivot] + state.pivots[group_name] = pivot_name + if verbose: + print("%s (%s): %s" % (group_name, pivot_name, rowds)) + + return state + +def run(fout, fn_ins, verbose=0): + print('Loading data') + + state = State.load(fn_ins) + comb_corr_sets(state, verbose=verbose) + state.print_stats() + if fout: + write_state(state, fout) + +def main(): + import argparse + + parser = argparse.ArgumentParser( + description= + 'Timing fuzzer' + ) + + parser.add_argument('--verbose', action='store_true', help='') + parser.add_argument('--speed-json', default='build_speed/speed.json', + help='Provides speed index to name translation') + parser.add_argument('--out', help='Output sub.json substitution result') + parser.add_argument( + 'fns_in', + nargs='*', + help='timing3.txt input files') + args = parser.parse_args() + bench = Benchmark() + + fout = None + if args.out: + fout = open(args.out, 'w') + + fns_in = args.fns_in + if not fns_in: + fns_in = glob.glob('specimen_*/timing3.csv') + + try: + run(fout=fout, + fn_ins=args.fns_in, verbose=args.verbose) + finally: + print('Exiting after %s' % bench) + +if __name__ == '__main__': + main() diff --git a/experiments/timfuz/timfuz_solve.py b/experiments/timfuz/timfuz_solve.py new file mode 100644 index 00000000..225d3060 --- /dev/null +++ b/experiments/timfuz/timfuz_solve.py @@ -0,0 +1,98 @@ +#!/usr/bin/env python3 + +def run_corner(A_ubd, b_ub, names, verbose=0, opts={}, meta={}): + # Given timing scores for above delays (-ps) + names_orig = names + + #print_eqns(A_ub, b_ub, verbose=verbose) + names, A_ubd, b_ub = massage_equations(A_ubd, b_ub, opts, names, verbose=verbose) + + print + print_eqns(A_ubd, b_ub, verbose=verbose) + + print + col_dist(A_ubd, 'final', names) + + A_ub, b_ub = Ab_d2np(A_ubd, b_ub, names) + + # Its having trouble giving me solutions as this gets bigger + # Make a terrible baseline guess to confirm we aren't doing something bad + #print_names(names, verbose=verbose) + check_feasible(A_ub=A_ub, b_ub=b_ub) + + ''' + Be mindful of signs + Have something like + timing1/timing 2 are constants + delay1 + delay2 + delay4 >= timing1 + delay2 + delay3 >= timing2 + + But need it in compliant form: + -delay1 + -delay2 + -delay4 <= -timing1 + -delay2 + -delay3 <= -timing2 + ''' + rows = len(A_ub) + cols = len(A_ub[0]) + # Minimization function scalars + # Treat all logic elements as equally important + c = [1 for _i in range(len(names))] + # Delays cannot be negative + # (this is also the default constraint) + #bounds = [(0, None) for _i in range(len(names))] + # Also you can provide one to apply to all + bounds = (0, None) + + # Seems to take about rows + 3 iterations + # Give some margin + #maxiter = int(1.1 * rows + 100) + #maxiter = max(1000, int(1000 * rows + 1000)) + # Most of the time I want it to just keep going unless I ^C it + maxiter = 1000000 + + if verbose >= 2: + print('b_ub', b_ub) + print('Unique delay elements: %d' % len(names)) + print(' # delay minimization weights: %d' % len(c)) + print(' # delay constraints: %d' % len(bounds)) + 
print('Input paths') + print(' # timing scores: %d' % len(b_ub)) + print(' Rows: %d' % rows) + + tlast = [time.time()] + iters = [0] + printn = [0] + def callback(xk, **kwargs): + iters[0] = kwargs['nit'] + if time.time() - tlast[0] > 1.0: + sys.stdout.write('I:%d ' % kwargs['nit']) + tlast[0] = time.time() + printn[0] += 1 + if printn[0] % 10 == 0: + sys.stdout.write('\n') + sys.stdout.flush() + + print('') + # Now find smallest values for delay constants + # Due to input bounds (ex: column limit), some delay elements may get eliminated entirely + print('Running linprog w/ %d r, %d c (%d name)' % (rows, cols, len(names_orig))) + res = linprog(c, A_ub=A_ub, b_ub=b_ub, bounds=bounds, callback=callback, + options={"disp": True, 'maxiter': maxiter, 'bland': True, 'tol': 1e-6,}) + nonzeros = 0 + print('Ran %d iters' % iters[0]) + if res.success: + print('Result sample (%d elements)' % (len(res.x))) + plim = 3 + for xi, (name, x) in enumerate(zip(names, res.x)): + nonzero = x >= 0.001 + if nonzero: + nonzeros += 1 + #if nonzero and (verbose >= 1 or xi > 30): + if nonzero and (verbose or ((nonzeros < 100 or nonzeros % 20 == 0) and nonzeros <= plim)): + print(' % 4u % -80s % 10.1f' % (xi, name, x)) + print('Delay on %d / %d' % (nonzeros, len(res.x))) + if not os.path.exists('res'): + os.mkdir('res') + fn_out = 'res/%s' % datetime.datetime.utcnow().isoformat().split('.')[0] + print('Writing %s' % fn_out) + np.save(fn_out, (3, c, A_ub, b_ub, bounds, names, res, meta)) + diff --git a/experiments/timfuz/top.v b/experiments/timfuz/top.v new file mode 100644 index 00000000..0cb9b8a3 --- /dev/null +++ b/experiments/timfuz/top.v @@ -0,0 +1,109 @@ +//move some stuff to minitests/ncy0 + +`define SEED 32'h12345678 + +module top(input clk, stb, di, output do); + localparam integer DIN_N = 42; + localparam integer DOUT_N = 79; + + reg [DIN_N-1:0] din; + wire [DOUT_N-1:0] dout; + + reg [DIN_N-1:0] din_shr; + reg [DOUT_N-1:0] dout_shr; + + always @(posedge clk) begin + din_shr <= {din_shr, di}; + dout_shr <= {dout_shr, din_shr[DIN_N-1]}; + if (stb) begin + din <= din_shr; + dout_shr <= dout; + end + end + + assign do = dout_shr[DOUT_N-1]; + + roi #(.DIN_N(DIN_N), .DOUT_N(DOUT_N)) + roi ( + .clk(clk), + .din(din), + .dout(dout) + ); +endmodule + +module roi(input clk, input [DIN_N-1:0] din, output [DOUT_N-1:0] dout); + parameter integer DIN_N = -1; + parameter integer DOUT_N = -1; + + /* + //Take out for now to make sure LUTs are more predictable + picorv32 picorv32 ( + .clk(clk), + .resetn(din[0]), + .mem_valid(dout[0]), + .mem_instr(dout[1]), + .mem_ready(din[1]), + .mem_addr(dout[33:2]), + .mem_wdata(dout[66:34]), + .mem_wstrb(dout[70:67]), + .mem_rdata(din[33:2]) + ); + */ + + /* + randluts randluts ( + .din(din[41:34]), + .dout(dout[78:71]) + ); + */ + randluts #(.N(150)) randluts ( + .din(din[41:34]), + .dout(dout[78:71]) + ); +endmodule + +module randluts(input [7:0] din, output [7:0] dout); + parameter integer N = 250; + + function [31:0] xorshift32(input [31:0] xorin); + begin + xorshift32 = xorin; + xorshift32 = xorshift32 ^ (xorshift32 << 13); + xorshift32 = xorshift32 ^ (xorshift32 >> 17); + xorshift32 = xorshift32 ^ (xorshift32 << 5); + end + endfunction + + function [63:0] lutinit(input [7:0] a, b); + begin + lutinit[63:32] = xorshift32(xorshift32(xorshift32(xorshift32({a, b} ^ `SEED)))); + lutinit[31: 0] = xorshift32(xorshift32(xorshift32(xorshift32({b, a} ^ `SEED)))); + end + endfunction + + wire [(N+1)*8-1:0] nets; + + assign nets[7:0] = din; + assign dout = nets[(N+1)*8-1:N*8]; + + genvar i, j; 
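
The LUT inputs above are scrambled with a 32-bit xorshift. An equivalent python3 sketch, useful for sanity-checking the Verilog function (the masking makes the 32-bit truncation of the left shifts explicit); illustration only:

    def xorshift32(x):
        x = (x ^ (x << 13)) & 0xffffffff
        x = (x ^ (x >> 17)) & 0xffffffff
        x = (x ^ (x << 5)) & 0xffffffff
        return x
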
+
+	generate
+		for (i = 0; i < N; i = i+1) begin:is
+			for (j = 0; j < 8; j = j+1) begin:js
+				localparam integer k = xorshift32(xorshift32(xorshift32(xorshift32((i << 20) ^ (j << 10) ^ `SEED)))) & 255;
+				(* KEEP, DONT_TOUCH *)
+				LUT6 #(
+					.INIT(lutinit(i, j))
+				) lut (
+					.I0(nets[8*i+(k+0)%8]),
+					.I1(nets[8*i+(k+1)%8]),
+					.I2(nets[8*i+(k+2)%8]),
+					.I3(nets[8*i+(k+3)%8]),
+					.I4(nets[8*i+(k+4)%8]),
+					.I5(nets[8*i+(k+5)%8]),
+					.O(nets[8*i+8+j])
+				);
+			end
+		end
+	endgenerate
+endmodule
diff --git a/experiments/timfuz/wire_unique.py b/experiments/timfuz/wire_unique.py
new file mode 100644
index 00000000..391c2e0c
--- /dev/null
+++ b/experiments/timfuz/wire_unique.py
@@ -0,0 +1,92 @@
+'''
+Verifies that wire timing info is unique
+'''
+
+import re
+
+def gen_wires(fin):
+    for l in fin:
+        lj = {}
+        l = l.strip()
+        for kvs in l.split():
+            name, value = kvs.split(':')
+            lj[name] = value
+
+        tile_type, xy, wname = re.match(r'(.*)_(X[0-9]*Y[0-9]*)/(.*)', lj['NAME']).groups()
+        lj['tile_type'] = tile_type
+        lj['xy'] = xy
+        lj['wname'] = wname
+
+        lj['l'] = l
+
+        yield lj
+
+def run(node_fin, verbose=0):
+    refnodes = {}
+    nodei = 0
+    for nodei, anode in enumerate(gen_wires(node_fin)):
+        def getk(anode):
+            return anode['wname']
+            #return (anode['tile_type'], anode['wname'])
+
+        if nodei % 1000 == 0:
+            print('Check node %d' % nodei)
+        # Existing node?
+        try:
+            refnode = refnodes[getk(anode)]
+        except KeyError:
+            # Set as reference
+            refnodes[getk(anode)] = anode
+            continue
+        k_invariant = (
+            'COST_CODE',
+            'IS_INPUT_PIN',
+            'IS_OUTPUT_PIN',
+            'IS_PART_OF_BUS',
+            'NUM_INTERSECTS',
+            'NUM_TILE_PORTS',
+            'SPEED_INDEX',
+            'TILE_PATTERN_OFFSET',
+        )
+        k_varies = (
+            'ID_IN_TILE_TYPE',
+            'IS_CONNECTED',
+            'NUM_DOWNHILL_PIPS',
+            'NUM_PIPS',
+            'NUM_UPHILL_PIPS',
+            'TILE_NAME',
+        )
+        # Verify equivalence
+        for k in k_invariant:
+            if k in refnode and k in anode:
+                def fail():
+                    print('Mismatch on %s' % k)
+                    print(refnode[k], anode[k])
+                    print(refnode['l'])
+                    print(anode['l'])
+                    #assert 0
+                if refnode[k] != anode[k]:
+                    print('')
+                    fail()
+            # A key in one but not the other?
+            elif k in refnode or k in anode:
+                assert 0
+            elif k not in k_varies:
+                assert 0
+
+if __name__ == '__main__':
+    import argparse
+
+    parser = argparse.ArgumentParser(
+        description=
+        'Timing fuzzer'
+    )
+
+    parser.add_argument('--verbose', type=int, help='')
+    parser.add_argument(
+        'node_fn_in',
+        default='/dev/stdin',
+        nargs='?',
+        help='Input file')
+    args = parser.parse_args()
+    run(open(args.node_fn_in, 'r'), verbose=args.verbose)
From 8c5436916c422e580619aafd7879d476047bc6c1 Mon Sep 17 00:00:00 2001
From: John McMaster
Date: Fri, 24 Aug 2018 12:51:21 -0700
Subject: [PATCH 02/55] timfuz: begin converting to fractions

Signed-off-by: John McMaster
---
 experiments/timfuz/timfuz_checksub.py |  4 +++-
 experiments/timfuz/timfuz_rref.py     | 21 +++++++++++++++++--
 2 files changed, 22 insertions(+), 3 deletions(-)

diff --git a/experiments/timfuz/timfuz_checksub.py b/experiments/timfuz/timfuz_checksub.py
index 774ce020..cf290d78 100644
--- a/experiments/timfuz/timfuz_checksub.py
+++ b/experiments/timfuz/timfuz_checksub.py
@@ -8,7 +8,7 @@ import math
 from collections import OrderedDict
 
 # check for issues that may be due to round off error
-STRICT = 1
+STRICT = 0
 
 def Adi2matrix_random(A_ubd, b_ub, names):
     # random assignment
@@ -92,6 +92,8 @@ def row_sub_syms(row, sub_json, verbose=False):
         assert pivot not in row
 
     # after all constants are applied, the row should end up positive?
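+    # (a fully substituted row is a sum of per-element delay counts, so the
+    # remaining coefficients should all stay positive)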
+ # numeric precision issues may limit this + # Ex: AssertionError: ('PIP_BSW_2ELSING0', -2.220446049250313e-16) if STRICT: for k, v in sorted(row.items()): assert v > 0, (k, v) diff --git a/experiments/timfuz/timfuz_rref.py b/experiments/timfuz/timfuz_rref.py index 2fc3c103..1fa514b3 100644 --- a/experiments/timfuz/timfuz_rref.py +++ b/experiments/timfuz/timfuz_rref.py @@ -12,8 +12,22 @@ import math import json import sympy from collections import OrderedDict +from fractions import Fraction -STRICT = 1 +STRICT = 0 + +def fracr(r): + DELTA = 0.0001 + + for i, x in enumerate(r): + if type(x) is float: + xi = int(x) + assert abs(xi - x) < DELTA + r[i] = xi + return [Fraction(x) for x in r] + +def fracm(m): + return [fracr(r) for r in m] class State(object): def __init__(self, Ads, drop_names=[]): @@ -97,10 +111,13 @@ def comb_corr_sets(state, verbose=False): mnp = Anp2matrix(Anp) print('Matrix: %u rows x %u cols' % (len(mnp), len(mnp[0]))) print('Converting np to sympy matrix') - msym = sympy.Matrix(mnp) + mfrac = fracm(mnp) + print('mfrac', type(mfrac[0][0])) + msym = sympy.Matrix(mfrac) print('Making rref') rref, pivots = msym.rref() + if verbose: print('names') print(names) From 71dad3d09cf498d69d567fab7b3507faaaa7eb36 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Fri, 24 Aug 2018 13:12:33 -0700 Subject: [PATCH 03/55] timfuz: use symbolic math to generate constants Signed-off-by: John McMaster --- experiments/timfuz/timfuz_checksub.py | 11 ++---- experiments/timfuz/timfuz_rref.py | 56 +++++++++++++++------------ 2 files changed, 35 insertions(+), 32 deletions(-) diff --git a/experiments/timfuz/timfuz_checksub.py b/experiments/timfuz/timfuz_checksub.py index cf290d78..a1bbc5d7 100644 --- a/experiments/timfuz/timfuz_checksub.py +++ b/experiments/timfuz/timfuz_checksub.py @@ -8,7 +8,7 @@ import math from collections import OrderedDict # check for issues that may be due to round off error -STRICT = 0 +STRICT = 1 def Adi2matrix_random(A_ubd, b_ub, names): # random assignment @@ -78,7 +78,7 @@ def row_sub_syms(row, sub_json, verbose=False): print('pivot %i %s' % (n, pivot)) for subk, subv in sorted(sub_json['subs'][group].items()): oldn = row.get(subk, 0) - rown = oldn - n * subv + rown = oldn - n * (1.0* subv[0] / subv[1]) if verbose: print(" %s: %d => %d" % (subk, oldn, rown)) if rown == 0: @@ -208,12 +208,7 @@ def load_sub(fn): for name, vals in sorted(j['subs'].items()): pivot = None for k, v in vals.items(): - if STRICT: - vi = int(round(v)) - assert abs(vi - v) < delta - vals[k] = vi - else: - vals[k] = float(v) + vals[k] = float(v) # there may be more than one acceptable pivot # take the first diff --git a/experiments/timfuz/timfuz_rref.py b/experiments/timfuz/timfuz_rref.py index 1fa514b3..0ac87967 100644 --- a/experiments/timfuz/timfuz_rref.py +++ b/experiments/timfuz/timfuz_rref.py @@ -14,8 +14,6 @@ import sympy from collections import OrderedDict from fractions import Fraction -STRICT = 0 - def fracr(r): DELTA = 0.0001 @@ -85,6 +83,12 @@ def Adi2matrix(Adi, cols): return A_ub2 def Anp2matrix(Anp): + ''' + Original idea was to make into a square matrix + but this loses too much information + so now this actually isn't doing anything and should probably be eliminated + ''' + ncols = len(Anp[0]) A_ub2 = [np.zeros(ncols) for _i in range(ncols)] dst_rowi = 0 @@ -102,6 +106,19 @@ def row_np2ds(rownp, names): ret[name] = v return ret +def row_sym2dsf(rowsym, names): + '''Convert a sympy row into a dictionary of keys to (numerator, denominator) tuples''' + from sympy import fraction + + 
ret = {}
+    assert len(rowsym) == len(names), (len(rowsym), len(names))
+    for namei, name in enumerate(names):
+        v = rowsym[namei]
+        if v:
+            (num, den) = fraction(v)
+            ret[name] = (int(num), int(den))
+    return ret
+
 def comb_corr_sets(state, verbose=False):
     print('Converting rows to integer keys')
     names, Anp = A_ds2np(state.Ads)
@@ -130,50 +147,41 @@ def comb_corr_sets(state, verbose=False):
 
     state.pivots = {}
 
-    def row_solved(rownp, row_pivot):
-        for ci, c in enumerate(rownp):
+    def row_solved(rowsym, row_pivot):
+        for ci, c in enumerate(rowsym):
             if ci == row_pivot:
                 continue
             if c != 0:
                 return False
         return True
 
-    rrefnp = np.array(rref).astype(np.float64)
-    print('Computing groups w/ rref %u row x %u col' % (len(rrefnp), len(rrefnp[0])))
+    #rrefnp = np.array(rref).astype(np.float64)
+    #print('Computing groups w/ rref %u row x %u col' % (len(rrefnp), len(rrefnp[0])))
    #print(rrefnp)

    # rows that have a single 1 are okay
    # anything else requires substitution (unless all 0)
    # pivots may be fewer than the rows
    # remaining rows should be 0s
-    for row_i, (row_pivot, rownp) in enumerate(zip(pivots, rrefnp)):
-        rowds = row_np2ds(rownp, names)
-        # boring cases: solved variable, not fully ranked
-        #if sum(rowds.values()) == 1:
-        if row_solved(rownp, row_pivot):
+    for row_i, row_pivot in enumerate(pivots):
+        rowsym = rref.row(row_i)
+        # yippee! nothing to report
+        if row_solved(rowsym, row_pivot):
             continue
 
         # a grouping
         group_name = "GROUP_%u" % row_i
-        if STRICT:
-            delta = 0.001
-            rowds_store = {}
-            for k, v in rowds.items():
-                vi = int(round(v))
-                error = abs(vi - v)
-                assert error < delta, (error, delta)
-                rowds_store[k] = vi
-        else:
-            rowds_store = rowds
-        state.subs[group_name] = rowds_store
+        rowdsf = row_sym2dsf(rowsym, names)
+
+        state.subs[group_name] = rowdsf
 
         # Add the new symbol
         state.names.add(group_name)
         # Remove substituted symbols
         # Note: symbols may appear multiple times
-        state.names.difference_update(set(rowds.keys()))
+        state.names.difference_update(set(rowdsf.keys()))
 
         pivot_name = names[row_pivot]
         state.pivots[group_name] = pivot_name
         if verbose:
-            print("%s (%s): %s" % (group_name, pivot_name, rowds))
+            print("%s (%s): %s" % (group_name, pivot_name, rowdsf))
 
     return state
 
From 97ea34d4cd5e39d0c68bf92a7d0200dd49153363 Mon Sep 17 00:00:00 2001
From: John McMaster
Date: Fri, 24 Aug 2018 13:22:34 -0700
Subject: [PATCH 04/55] timfuz: checksub uses fractions

Signed-off-by: John McMaster
---
 experiments/timfuz/timfuz_checksub.py | 32 +++++----------------------
 1 file changed, 6 insertions(+), 26 deletions(-)

diff --git a/experiments/timfuz/timfuz_checksub.py b/experiments/timfuz/timfuz_checksub.py
index a1bbc5d7..3bd4df63 100644
--- a/experiments/timfuz/timfuz_checksub.py
+++ b/experiments/timfuz/timfuz_checksub.py
@@ -6,6 +6,7 @@ import glob
 import json
 import math
 from collections import OrderedDict
+from fractions import Fraction
 
 # check for issues that may be due to round off error
 STRICT = 1
@@ -77,8 +78,8 @@ def row_sub_syms(row, sub_json, verbose=False):
         if verbose:
             print('pivot %i %s' % (n, pivot))
         for subk, subv in sorted(sub_json['subs'][group].items()):
-            oldn = row.get(subk, 0)
-            rown = oldn - n * (1.0* subv[0] / subv[1])
+            oldn = row.get(subk, Fraction(0))
+            rown = oldn - n * subv
             if verbose:
                 print("  %s: %d => %d" % (subk, oldn, rown))
             if rown == 0:
@@ -190,32 +191,11 @@ def run(fns_in, sub_json=None, verbose=False, corner=None):
             print('slogdet :) : %s, %s' % (sign, logdet))
 
 def load_sub(fn):
-    delta = 0.001
     j = json.load(open(fn, 'r'))
 
-    # convert groups to use integer constants
- # beware of roundoff error - # if we round poorly here, it won't give incorrect results later, but may make it fail to find a good solution - - if 'pivots' in j: - print('pivots: using existing') - else: - print('pivots: guessing') - - pivots = OrderedDict() - j['pivots'] = pivots - - for name, vals in sorted(j['subs'].items()): - pivot = None - for k, v in vals.items(): - vals[k] = float(v) - - # there may be more than one acceptable pivot - # take the first - if v == 1 and pivot is None: - pivot = k - assert pivot is not None - pivots[name] = pivot + for name, vals in sorted(j['subs'].items()): + for k, v in vals.items(): + vals[k] = Fraction(v[0], v[1]) return j From aeebb45b34446fefbb14bb713a1ba590ca465f02 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Fri, 24 Aug 2018 14:10:36 -0700 Subject: [PATCH 05/55] timfuz: timfuz_solve main() Signed-off-by: John McMaster --- experiments/timfuz/timfuz.py | 121 +++++++++++++++++-- experiments/timfuz/timfuz_checksub.py | 117 ++---------------- experiments/timfuz/timfuz_solve.py | 165 ++++++++++++++++++++++---- 3 files changed, 261 insertions(+), 142 deletions(-) diff --git a/experiments/timfuz/timfuz.py b/experiments/timfuz/timfuz.py index 1e14074b..9082c25b 100644 --- a/experiments/timfuz/timfuz.py +++ b/experiments/timfuz/timfuz.py @@ -1,7 +1,5 @@ #!/usr/bin/env python -# https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html -from scipy.optimize import linprog import math import numpy as np from collections import OrderedDict @@ -14,6 +12,7 @@ import copy import sys import random import glob +from fractions import Fraction from benchmark import Benchmark @@ -229,36 +228,33 @@ def simplify_cols(names, A_ubd, b_ub): nr = list(names_ret.keys()) return nr, A_ub_ret, b_ub -def A_ubr_np2d(row, sf=1): +def A_ubr_np2d(row): '''Convert a single row''' #d = {} d = OrderedDict() for coli, val in enumerate(row): if val: - d[coli] = sf * val + d[coli] = val return d -def A_ub_np2d(A_ub, sf=1): +def A_ub_np2d(A_ub): '''Convert A_ub entries in numpy matrix to dictionary / sparse form''' A_ubd = [None] * len(A_ub) for i, row in enumerate(A_ub): - A_ubd[i] = A_ubr_np2d(row, sf=sf) + A_ubd[i] = A_ubr_np2d(row) return A_ubd -# def Ar_ds2np(row_ds, names): -# Ar_di2np(row_di, cols, sf=1) - -def Ar_di2np(row_di, cols, sf=1): +def Ar_di2np(row_di, cols): rownp = np.zeros(cols) for coli, val in row_di.items(): # Sign inversion due to way solver works - rownp[coli] = sf * val + rownp[coli] = val return rownp # NOTE: sign inversion -def A_di2np(Adi, cols, sf=1): +def A_di2np(Adi, cols): '''Convert A_ub entries in dictionary / sparse to numpy matrix form''' - return [Ar_di2np(row_di, cols, sf=sf) for row_di in Adi] + return [Ar_di2np(row_di, cols) for row_di in Adi] def Ar_ds2t(rowd): '''Convert a dictionary row into a tuple with (column number, value) tuples''' @@ -817,3 +813,102 @@ def index_names(Ads): for k1 in row_ds.keys(): names.add(k1) return names + +def load_sub(fn): + j = json.load(open(fn, 'r')) + + for name, vals in sorted(j['subs'].items()): + for k, v in vals.items(): + vals[k] = Fraction(v[0], v[1]) + + return j + +def row_sub_syms(row, sub_json, verbose=False): + if 0 and verbose: + print("") + print(row.items()) + + delsyms = 0 + for k in sub_json['drop_names']: + try: + del row[k] + delsyms += 1 + except KeyError: + pass + if verbose: + print("Deleted %u symbols" % delsyms) + + if verbose: + print('Checking pivots') + print(sorted(row.items())) + for group, pivot in sorted(sub_json['pivots'].items()): + if pivot 
not in row: + continue + n = row[pivot] + print(' pivot %u %s' % (n, pivot)) + + for group, pivot in sorted(sub_json['pivots'].items()): + if pivot not in row: + continue + + # take the sub out n times + # note constants may be negative + n = row[pivot] + if verbose: + print('pivot %i %s' % (n, pivot)) + for subk, subv in sorted(sub_json['subs'][group].items()): + oldn = row.get(subk, Fraction(0)) + rown = oldn - n * subv + if verbose: + print(" %s: %d => %d" % (subk, oldn, rown)) + if rown == 0: + # only becomes zero if didn't previously exist + del row[subk] + if verbose: + print(" del") + else: + row[subk] = rown + row[group] = n + assert pivot not in row + + # after all constants are applied, the row should end up positive? + # numeric precision issues previously limited this + # Ex: AssertionError: ('PIP_BSW_2ELSING0', -2.220446049250313e-16) + for k, v in sorted(row.items()): + assert v > 0, (k, v) + +def run_sub_json(Ads, sub_json, verbose=False): + nrows = 0 + nsubs = 0 + + ncols_old = 0 + ncols_new = 0 + + print('Subbing %u rows' % len(Ads)) + prints = set() + + for rowi, row in enumerate(Ads): + if 0 and verbose: + print(row) + if verbose: + print('') + print('Row %u w/ %u elements' % (rowi, len(row))) + + row_orig = dict(row) + row_sub_syms(row, sub_json, verbose=verbose) + nrows += 1 + if row_orig != row: + nsubs += 1 + if verbose: + rowt = Ar_ds2t(row) + if rowt not in prints: + print('row', row) + prints.add(rowt) + ncols_old += len(row_orig) + ncols_new += len(row) + + if verbose: + print('') + + print("Sub: %u / %u rows changed" % (nsubs, nrows)) + print("Sub: %u => %u cols" % (ncols_old, ncols_new)) diff --git a/experiments/timfuz/timfuz_checksub.py b/experiments/timfuz/timfuz_checksub.py index 3bd4df63..f91fb38e 100644 --- a/experiments/timfuz/timfuz_checksub.py +++ b/experiments/timfuz/timfuz_checksub.py @@ -1,6 +1,6 @@ #!/usr/bin/env python3 -from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np +from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json import numpy as np import glob import json @@ -8,9 +8,6 @@ import math from collections import OrderedDict from fractions import Fraction -# check for issues that may be due to round off error -STRICT = 1 - def Adi2matrix_random(A_ubd, b_ub, names): # random assignment # was making some empty rows @@ -44,97 +41,6 @@ def Ads2matrix_linear(Ads, b): dst_rowi = (dst_rowi + 1) % rows_out return A_ret, b_ret -def row_sub_syms(row, sub_json, verbose=False): - if 0 and verbose: - print("") - print(row.items()) - - delsyms = 0 - for k in sub_json['drop_names']: - try: - del row[k] - delsyms += 1 - except KeyError: - pass - if verbose: - print("Deleted %u symbols" % delsyms) - - if verbose: - print('Checking pivots') - print(sorted(row.items())) - for group, pivot in sorted(sub_json['pivots'].items()): - if pivot not in row: - continue - n = row[pivot] - print(' pivot %u %s' % (n, pivot)) - - for group, pivot in sorted(sub_json['pivots'].items()): - if pivot not in row: - continue - - # take the sub out n times - # note constants may be negative - n = row[pivot] - if verbose: - print('pivot %i %s' % (n, pivot)) - for subk, subv in sorted(sub_json['subs'][group].items()): - oldn = row.get(subk, Fraction(0)) - rown = oldn - n * subv - if verbose: - print(" %s: %d => %d" % (subk, oldn, rown)) - if rown == 0: - # only becomes zero if didn't previously exist - del row[subk] - if verbose: - 
print(" del") - else: - row[subk] = rown - row[group] = n - assert pivot not in row - - # after all constants are applied, the row should end up positive? - # numeric precision issues may limit this - # Ex: AssertionError: ('PIP_BSW_2ELSING0', -2.220446049250313e-16) - if STRICT: - for k, v in sorted(row.items()): - assert v > 0, (k, v) - -def run_sub_json(Ads, sub_json, verbose=False): - nrows = 0 - nsubs = 0 - - ncols_old = 0 - ncols_new = 0 - - print('Subbing %u rows' % len(Ads)) - prints = set() - - for rowi, row in enumerate(Ads): - if 0 and verbose: - print(row) - if verbose: - print('') - print('Row %u w/ %u elements' % (rowi, len(row))) - - row_orig = dict(row) - row_sub_syms(row, sub_json, verbose=verbose) - nrows += 1 - if row_orig != row: - nsubs += 1 - if verbose: - rowt = Ar_ds2t(row) - if rowt not in prints: - print('row', row) - prints.add(rowt) - ncols_old += len(row_orig) - ncols_new += len(row) - - if verbose: - print('') - - print("Sub: %u / %u rows changed" % (nsubs, nrows)) - print("Sub: %u => %u cols" % (ncols_old, ncols_new)) - def pmatrix(Anp, s): import sympy msym = sympy.Matrix(Anp) @@ -146,7 +52,10 @@ def pds(Ads, s): pmatrix(Anp, s) print('Names: %s' % (names,)) -def run(fns_in, sub_json=None, verbose=False, corner=None): +def run(fns_in, sub_json=None, verbose=False): + # arbitrary...data is thrown away + corner = "slow_max" + Ads, b = loadc_Ads_b(fns_in, corner, ico=True) # Remove duplicate rows @@ -190,15 +99,6 @@ def run(fns_in, sub_json=None, verbose=False, corner=None): else: print('slogdet :) : %s, %s' % (sign, logdet)) -def load_sub(fn): - j = json.load(open(fn, 'r')) - - for name, vals in sorted(j['subs'].items()): - for k, v in vals.items(): - vals[k] = Fraction(v[0], v[1]) - - return j - def main(): import argparse @@ -209,18 +109,17 @@ def main(): parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--sub-json', help='') - parser.add_argument('--corner', default="slow_max", help='') parser.add_argument( 'fns_in', nargs='*', - help='timing3.txt input files') + help='timing3.csv input files') args = parser.parse_args() # Store options in dict to ease passing through functions bench = Benchmark() fns_in = args.fns_in if not fns_in: - fns_in = glob.glob('specimen_*/timing3.txt') + fns_in = glob.glob('specimen_*/timing3.csv') sub_json = None if args.sub_json: @@ -228,7 +127,7 @@ def main(): try: run(sub_json=sub_json, - fns_in=fns_in, verbose=args.verbose, corner=args.corner) + fns_in=fns_in, verbose=args.verbose) finally: print('Exiting after %s' % bench) diff --git a/experiments/timfuz/timfuz_solve.py b/experiments/timfuz/timfuz_solve.py index 225d3060..2041d773 100644 --- a/experiments/timfuz/timfuz_solve.py +++ b/experiments/timfuz/timfuz_solve.py @@ -1,24 +1,77 @@ #!/usr/bin/env python3 -def run_corner(A_ubd, b_ub, names, verbose=0, opts={}, meta={}): +# https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html +from scipy.optimize import linprog +from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json +import numpy as np +import glob +import json +import math +from collections import OrderedDict +from fractions import Fraction +import sys +import datetime +import os +import time + +def check_feasible(A_ub, b_ub): + ''' + Put large timing constants into the equations + See if that would solve it + + Its having trouble giving me solutions as this gets bigger + Make a terrible baseline guess to confirm we 
aren't doing something bad + ''' + + sys.stdout.write('Check feasible ') + sys.stdout.flush() + + rows = len(b_ub) + cols = len(A_ub[0]) + + progress = max(1, rows / 100) + + # Chose a high arbitrary value for x + # Delays should be in order of ns, so a 10 ns delay should be way above what anything should be + xs = [10e3 for _i in range(cols)] + + # FIXME: use the correct np function to do this for me + # Verify bounds + #b_res = np.matmul(A_ub, xs) + #print(type(A_ub), type(xs) + #A_ub = np.array(A_ub) + #xs = np.array(xs) + #b_res = np.matmul(A_ub, xs) + def my_mul(A_ub, xs): + #print('cols', cols + #print('rows', rows + ret = [None] * rows + for row in range(rows): + this = 0 + for col in range(cols): + this += A_ub[row][col] * xs[col] + ret[row] = this + return ret + b_res = my_mul(A_ub, xs) + + # Verify bound was respected + for rowi, (this_b, this_b_ub) in enumerate(zip(b_res, b_ub)): + if rowi % progress == 0: + sys.stdout.write('.') + sys.stdout.flush() + if this_b >= this_b_ub or this_b > 0: + print('% 4d Want res % 10.1f <= % 10.1f <= 0' % (rowi, this_b, this_b_ub)) + raise Exception("Bad ") + print(' done') + +def run_corner(Anp, b, names, verbose=False, opts={}, meta={}): + assert type(Anp[0]) is np.ndarray, type(Anp[0]) + assert type(b) is np.ndarray, type(b) + # Given timing scores for above delays (-ps) names_orig = names - #print_eqns(A_ub, b_ub, verbose=verbose) - names, A_ubd, b_ub = massage_equations(A_ubd, b_ub, opts, names, verbose=verbose) - - print - print_eqns(A_ubd, b_ub, verbose=verbose) - - print - col_dist(A_ubd, 'final', names) - - A_ub, b_ub = Ab_d2np(A_ubd, b_ub, names) - - # Its having trouble giving me solutions as this gets bigger - # Make a terrible baseline guess to confirm we aren't doing something bad - #print_names(names, verbose=verbose) - check_feasible(A_ub=A_ub, b_ub=b_ub) + #check_feasible(Anp, b) ''' Be mindful of signs @@ -31,8 +84,14 @@ def run_corner(A_ubd, b_ub, names, verbose=0, opts={}, meta={}): -delay1 + -delay2 + -delay4 <= -timing1 -delay2 + -delay3 <= -timing2 ''' - rows = len(A_ub) - cols = len(A_ub[0]) + rows = len(Anp) + cols = len(Anp[0]) + print('Scaling to solution form...') + b_ub = -1.0 * b + #A_ub = -1.0 * Anp + A_ub = [-1.0 * x for x in Anp] + + print('Creating misc constants...') # Minimization function scalars # Treat all logic elements as equally important c = [1 for _i in range(len(names))] @@ -50,12 +109,12 @@ def run_corner(A_ubd, b_ub, names, verbose=0, opts={}, meta={}): maxiter = 1000000 if verbose >= 2: - print('b_ub', b_ub) + print('b_ub', b) print('Unique delay elements: %d' % len(names)) print(' # delay minimization weights: %d' % len(c)) print(' # delay constraints: %d' % len(bounds)) print('Input paths') - print(' # timing scores: %d' % len(b_ub)) + print(' # timing scores: %d' % len(b)) print(' Rows: %d' % rows) tlast = [time.time()] @@ -96,3 +155,69 @@ def run_corner(A_ubd, b_ub, names, verbose=0, opts={}, meta={}): print('Writing %s' % fn_out) np.save(fn_out, (3, c, A_ub, b_ub, bounds, names, res, meta)) +def run(fns_in, corner, sub_json=None, dedup=True, verbose=False): + Ads, b = loadc_Ads_b(fns_in, corner, ico=True) + + # Remove duplicate rows + # is this necessary? 
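+    # (simplify_rows drops duplicate rows, keeping the largest b for each;
+    # see timfuz.py)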
+ # maybe better to just add them into the matrix directly + if dedup: + oldn = len(Ads) + Ads, b = simplify_rows(Ads, b) + print('Simplify %u => %u rows' % (oldn, len(Ads))) + + if sub_json: + print('Sub: %u rows' % len(Ads)) + names_old = index_names(Ads) + run_sub_json(Ads, sub_json, verbose=verbose) + names = index_names(Ads) + print("Sub: %u => %u names" % (len(names_old), len(names))) + else: + names = index_names(Ads) + + if 0: + print + print_eqns(A_ubd, b_ub, verbose=verbose) + + print + col_dist(A_ubd, 'final', names) + + print('Converting to numpy...') + names, Anp = A_ds2np(Ads) + run_corner(Anp, np.asarray(b), names, verbose=verbose) + +def main(): + import argparse + + parser = argparse.ArgumentParser( + description= + 'Solve timing solution' + ) + + parser.add_argument('--verbose', action='store_true', help='') + parser.add_argument('--sub-json', help='Group substitutions to make fully ranked') + parser.add_argument('--corner', default="slow_max", help='') + parser.add_argument( + 'fns_in', + nargs='*', + help='timing3.csv input files') + args = parser.parse_args() + # Store options in dict to ease passing through functions + bench = Benchmark() + + fns_in = args.fns_in + if not fns_in: + fns_in = glob.glob('specimen_*/timing3.csv') + + sub_json = None + if args.sub_json: + sub_json = load_sub(args.sub_json) + + try: + run(sub_json=sub_json, + fns_in=fns_in, verbose=args.verbose, corner=args.corner) + finally: + print('Exiting after %s' % bench) + +if __name__ == '__main__': + main() From 343cd5b41386106590df35865ee029c0ae2c27b7 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Fri, 24 Aug 2018 14:56:50 -0700 Subject: [PATCH 06/55] timfuz: old massage routines added back in Signed-off-by: John McMaster --- experiments/timfuz/timfuz.py | 146 +++--------- experiments/timfuz/timfuz_massage.py | 335 +++++++++++++++++++++++++++ experiments/timfuz/timfuz_rref.py | 2 +- experiments/timfuz/timfuz_solve.py | 31 ++- 4 files changed, 385 insertions(+), 129 deletions(-) create mode 100644 experiments/timfuz/timfuz_massage.py diff --git a/experiments/timfuz/timfuz.py b/experiments/timfuz/timfuz.py index 9082c25b..f0b4af9f 100644 --- a/experiments/timfuz/timfuz.py +++ b/experiments/timfuz/timfuz.py @@ -130,18 +130,18 @@ def Ab_ub_dt2d(eqns): return list(A_ubd), list(b_ub) # This significantly reduces runtime -def simplify_rows(A_ubd, b_ub): +def simplify_rows(Ads, b_ub): '''Remove duplicate equations, taking highest delay''' # dict of constants to highest delay eqns = OrderedDict() - assert len(A_ubd) == len(b_ub), (len(A_ubd), len(b_ub)) + assert len(Ads) == len(b_ub), (len(Ads), len(b_ub)) sys.stdout.write('SimpR ') sys.stdout.flush() progress = max(1, len(b_ub) / 100) zero_ds = 0 zero_es = 0 - for loopi, (b, rowd) in enumerate(zip(b_ub, A_ubd)): + for loopi, (b, rowd) in enumerate(zip(b_ub, Ads)): if loopi % progress == 0: sys.stdout.write('.') sys.stdout.flush() @@ -173,61 +173,6 @@ def simplify_rows(A_ubd, b_ub): #return A_ub_np2d(A_ub_ret), b_ub_ret return A_ubd_ret, b_ub_ret -def simplify_cols(names, A_ubd, b_ub): - ''' - Remove unsued columns - This is fairly straightforward in dictionary form now as only have to remove and adjust indices - Maybe should use the names as keys? Then this wouldn't be needed anymore as indices wouldn't need to be rebased - - XXX: shuffles the name order around. Do we care? 
- ''' - - # First: find unused names - # use dict since no standard ordered set - used_cols = set() - names_ret = OrderedDict() - col_old2new = OrderedDict() - rows = len(b_ub) - cols = len(names) - - sys.stdout.write('SimpC indexing ') - sys.stdout.flush() - progress = max(1, rows / 100) - for rowi, rowd in enumerate(A_ubd): - if rowi % progress == 0: - sys.stdout.write('.') - sys.stdout.flush() - for coli in rowd.keys(): - used_cols.add(coli) - - for coli in range(cols): - if coli in used_cols: - names_ret[names[coli]] = None - col_old2new[coli] = len(col_old2new) - assert len(used_cols) == len(col_old2new) - - print(' done') - - # Create a new matrix, copying important values over - #A_ub_ret = np.zeros((4, 1)) - #A_ub_ret[3][0] = 1.0 - #A_ub_ret = np.zeros((rows, len(names_ret))) - A_ub_ret = [None] * rows - sys.stdout.write('SimpC creating ') - sys.stdout.flush() - progress = max(1, rows / 100) - for rowi, rowd_old in enumerate(A_ubd): - if rowi % progress == 0: - sys.stdout.write('.') - sys.stdout.flush() - l = [(col_old2new[k], v) for k, v in rowd_old.items()] - A_ub_ret[rowi] = OrderedDict(l) - print(' done') - - print('Simplify cols: %d => %d cols' % (len(names), len(names_ret))) - nr = list(names_ret.keys()) - return nr, A_ub_ret, b_ub - def A_ubr_np2d(row): '''Convert a single row''' #d = {} @@ -239,10 +184,10 @@ def A_ubr_np2d(row): def A_ub_np2d(A_ub): '''Convert A_ub entries in numpy matrix to dictionary / sparse form''' - A_ubd = [None] * len(A_ub) + Adi = [None] * len(A_ub) for i, row in enumerate(A_ub): - A_ubd[i] = A_ubr_np2d(row) - return A_ubd + Adi[i] = A_ubr_np2d(row) + return Adi def Ar_di2np(row_di, cols): rownp = np.zeros(cols) @@ -282,66 +227,15 @@ def Ab_np2d(A_ub, b_ub_inv): b_ub = invb(b_ub_inv) return A_ubd, b_ub -def sort_equations_(A_ubd, b_ub): - # Dictionaries aren't hashable for sorting even though they are comparable - return A_ub_t2d(sorted(A_ub_d2t(A_ubd))) - -def sort_equations(A_ub, b_ub): +def sort_equations(Ads, b): # Track rows with value column # Hmm can't sort against np arrays - tosort = [(sorted(row.items()), b) for row, b in zip(A_ub, b_ub)] + tosort = [(sorted(row.items()), rowb) for row, rowb in zip(Ads, b)] #res = sorted(tosort, key=lambda e: e[0]) res = sorted(tosort) A_ubtr, b_ubr = zip(*res) return [OrderedDict(rowt) for rowt in A_ubtr], b_ubr -def lte_const(row_ref, row_cmp): - '''Return true if all constants are smaller magnitude in row_cmp than row_ref''' - #return False - for k, vc in row_cmp.items(): - vr = row_ref.get(k, None) - # Not in reference? - if vr is None: - return False - if vr < vc: - return False - return True - -def shared_const(row_ref, row_cmp): - '''Return true if more constants are equal than not equal''' - #return False - matches = 0 - unmatches = 0 - ks = list(row_ref.keys()) + list(row_cmp.keys()) - for k in ks: - vr = row_ref.get(k, None) - vc = row_cmp.get(k, None) - # At least one - if vr is not None and vc is not None: - if vc == vr: - matches += 1 - else: - unmatches += 1 - else: - unmatches += 1 - - # Will equation reduce if subtracted? 
- return matches > unmatches - -def reduce_const(row_ref, row_cmp): - '''Subtract cmp constants from ref''' - #ret = {} - ret = OrderedDict() - ks = set(row_ref.keys()) - ks.update(set(row_cmp.keys())) - for k in ks: - vr = row_ref.get(k, 0) - vc = row_cmp.get(k, 0) - res = vr - vc - if res: - ret[k] = res - return ret - def derive_eq_by_row(A_ubd, b_ub, verbose=0, col_lim=0, tweak=False): ''' Derive equations by subtracting whole rows @@ -510,13 +404,13 @@ def derive_eq_by_col(A_ubd, b_ub, verbose=0): print('Derive col: %d => %d rows' % (len(b_ub), len(b_ub_ret))) return A_ubd_ret, b_ub_ret -def col_dist(A_ubd, desc='of', names=[], lim=0): +def col_dist(Ads, desc='of', names=[], lim=0): '''print(frequency distribution of number of elements in a given row''' - rows = len(A_ubd) + rows = len(Ads) cols = len(names) fs = {} - for row in A_ubd: + for row in Ads: this_cols = len(row) fs[this_cols] = fs.get(this_cols, 0) + 1 @@ -912,3 +806,21 @@ def run_sub_json(Ads, sub_json, verbose=False): print("Sub: %u / %u rows changed" % (nsubs, nrows)) print("Sub: %u => %u cols" % (ncols_old, ncols_new)) + +def print_eqns(Ads, b, verbose=0, lim=3, label=''): + rows = len(b) + + print('Sample equations (%s) from %d r' % (label, rows)) + prints = 0 + for rowi, row in enumerate(Ads): + if verbose or ((rowi < 10 or rowi % max(1, (rows / 20)) == 0) and (not lim or prints < lim)): + line = ' EQN: p%u: ' % rowi + for k, v in sorted(row.items()): + line += '%u*t%s ' % (v, k) + line += '= %d' % b[rowi] + print(line) + prints += 1 + +def print_eqns_np(A_ub, b_ub, verbose=0): + Adi = A_ub_np2d(A_ub) + print_eqns(Adi, b_ub, verbose=verbose) diff --git a/experiments/timfuz/timfuz_massage.py b/experiments/timfuz/timfuz_massage.py new file mode 100644 index 00000000..add24fe1 --- /dev/null +++ b/experiments/timfuz/timfuz_massage.py @@ -0,0 +1,335 @@ +#!/usr/bin/env python3 + +from timfuz import simplify_rows, print_eqns, print_eqns_np, sort_equations, col_dist +import numpy as np +import math +import sys +import datetime +import os +import time +import copy +from collections import OrderedDict + +def lte_const(row_ref, row_cmp): + '''Return true if all constants are smaller magnitude in row_cmp than row_ref''' + #return False + for k, vc in row_cmp.items(): + vr = row_ref.get(k, None) + # Not in reference? + if vr is None: + return False + if vr < vc: + return False + return True + +def shared_const(row_ref, row_cmp): + '''Return true if more constants are equal than not equal''' + #return False + matches = 0 + unmatches = 0 + ks = list(row_ref.keys()) + list(row_cmp.keys()) + for k in ks: + vr = row_ref.get(k, None) + vc = row_cmp.get(k, None) + # At least one + if vr is not None and vc is not None: + if vc == vr: + matches += 1 + else: + unmatches += 1 + else: + unmatches += 1 + + # Will equation reduce if subtracted? 
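+    # note: ks concatenates both key lists, so a key present in both rows is
+    # visited twice and its match/unmatch result is counted double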
+    return matches > unmatches
+
+def reduce_const(row_ref, row_cmp):
+    '''Subtract cmp constants from ref'''
+    #ret = {}
+    ret = OrderedDict()
+    ks = set(row_ref.keys())
+    ks.update(set(row_cmp.keys()))
+    for k in ks:
+        vr = row_ref.get(k, 0)
+        vc = row_cmp.get(k, 0)
+        res = vr - vc
+        if res:
+            ret[k] = res
+    return ret
+
+def derive_eq_by_row(Ads, b, verbose=0, col_lim=0, tweak=False):
+    '''
+    Derive equations by subtracting whole rows
+
+    Given equations like:
+    t0 >= 10
+    t0 + t1 >= 15
+    t0 + t1 + t2 >= 17
+
+    When I look at these, I think of a solution something like:
+    t0 = 10
+    t1 = 5
+    t2 = 2
+
+    However, linprog tends to choose solutions like:
+    t0 = 17
+    t1 = 0
+    t2 = 0
+
+    To this end, add additional constraints by finding equations that are subsets of other equations
+    How to do this in a reasonable time span?
+    Also equations are sparse, which makes this harder to compute
+    '''
+    rows = len(Ads)
+    assert rows == len(b)
+
+    # Index equations into hash maps so can lookup sparse elements quicker
+    assert len(Ads) == len(b)
+    Ads_ret = copy.copy(Ads)
+    assert len(Ads) == len(Ads_ret)
+
+    #print('Finding subsets')
+    ltes = 0
+    scs = 0
+    b_ret = list(b)
+    sys.stdout.write('Deriving rows ')
+    sys.stdout.flush()
+    progress = max(1, rows / 100)
+    for row_refi, row_ref in enumerate(Ads):
+        if row_refi % progress == 0:
+            sys.stdout.write('.')
+            sys.stdout.flush()
+        if col_lim and len(row_ref) > col_lim:
+            continue
+
+        for row_cmpi, row_cmp in enumerate(Ads):
+            if row_refi == row_cmpi or col_lim and len(row_cmp) > col_lim:
+                continue
+            # FIXME: this check was supposed to be removed
+            '''
+            Every element in row_cmp is in row_ref
+            but this doesn't mean the constants are smaller
+            Filter these out
+            '''
+            # XXX: just reduce and filter out solutions with positive constants
+            # or actually are these also useful as is?
+            lte = lte_const(row_ref, row_cmp)
+            if lte:
+                ltes += 1
+            sc = 0 and shared_const(row_ref, row_cmp)
+            if sc:
+                scs += 1
+            if lte or sc:
+                if verbose:
+                    print('')
+                    print('match')
+                    print(' ', row_ref, b[row_refi])
+                    print(' ', row_cmp, b[row_cmpi])
+                # Reduce
+                A_new = reduce_const(row_ref, row_cmp)
+                # Did this actually significantly reduce the search space?
+                #if tweak and len(A_new) > 4 and len(A_new) > len(row_cmp) / 2:
+                if tweak and len(A_new) > 8 and len(A_new) > len(row_cmp) / 2:
+                    continue
+                b_new = b[row_refi] - b[row_cmpi]
+                # Definitely possible
+                # Maybe filter these out if they occur?
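+                # e.g. ref t0 + t1 >= 15 minus cmp t0 >= 10 derives t1 >= 5;
+                # if the subtracted row carried the larger delay, b_new comes
+                # out <= 0 and the derived row is dropped below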
+                if verbose:
+                    print(b_new)
+                # Also inverted sign
+                if b_new <= 0:
+                    if verbose:
+                        print("Unexpected b")
+                    continue
+                if verbose:
+                    print('OK')
+                Ads_ret.append(A_new)
+                b_ret.append(b_new)
+    print(' done')
+
+    #A_ub_ret = A_di2np(Ads2, cols=cols)
+    print('Derive row: %d => %d rows using %d lte, %d sc' % (len(b), len(b_ret), ltes, scs))
+    assert len(Ads_ret) == len(b_ret)
+    return Ads_ret, b_ret
+
+def derive_eq_by_col(Ads, b_ub, verbose=0):
+    '''
+    Derive equations by subtracting out all bounded constants (ie "known" columns)
+    '''
+    rows = len(Ads)
+
+    # Find all entries where
+
+    # Index equations with a single constraint
+    knowns = {}
+    sys.stdout.write('Derive col indexing ')
+    sys.stdout.flush()
+    progress = max(1, rows / 100)
+    for row_refi, row_refd in enumerate(Ads):
+        if row_refi % progress == 0:
+            sys.stdout.write('.')
+            sys.stdout.flush()
+        if len(row_refd) == 1:
+            k, v = list(row_refd.items())[0]
+            # Reduce any constants to canonical form
+            if v != 1:
+                row_refd[k] = 1
+                b_ub[row_refi] /= v
+            knowns[k] = b_ub[row_refi]
+    print(' done')
+    #knowns_set = set(knowns.keys())
+    print('%d constrained' % len(knowns))
+
+    '''
+    Now see what we can do
+    Rows that are already constrained: eliminate
+    TODO: maybe keep these if this would violate their constraint
+    Otherwise eliminate the original row and generate a simplified result now
+    '''
+    b_ret = []
+    Ads_ret = []
+    sys.stdout.write('Derive col main ')
+    sys.stdout.flush()
+    progress = max(1, rows / 100)
+    for row_refi, row_refd in enumerate(Ads):
+        if row_refi % progress == 0:
+            sys.stdout.write('.')
+            sys.stdout.flush()
+        # Reduce as much as possible
+        #row_new = {}
+        row_new = OrderedDict()
+        b_new = b_ub[row_refi]
+        # Copy over single entries
+        if len(row_refd) == 1:
+            row_new = row_refd
+        else:
+            for k, v in row_refd.items():
+                if k in knowns:
+                    # Remove column and take out corresponding delay
+                    b_new -= v * knowns[k]
+                # Copy over
+                else:
+                    row_new[k] = v
+
+        # Possibly reduced all usable constants out
+        if len(row_new) == 0:
+            continue
+        if b_new <= 0:
+            continue
+
+        Ads_ret.append(row_new)
+        b_ret.append(b_new)
+    print(' done')
+
+    print('Derive col: %d => %d rows' % (len(b_ub), len(b_ret)))
+    return Ads_ret, b_ret
+
+def massage_equations(Ads, b, verbose=False, derive_lim=3):
+    '''
+    Equation pipeline
+    Some operations may generate new equations
+    Simplify after these to avoid unnecessary overhead on redundant constraints
+    Similarly some operations may eliminate equations, potentially eliminating a column (ie variable)
+    Remove these columns as necessary to speed up solving
+    '''
+
+    def debug(what):
+        if verbose:
+            print('')
+            print_eqns(Ads, b, verbose=verbose, label=what, lim=20)
+            col_dist(Ads, what)
+            check_feasible_d(Ads, b)
+
+    # Try to (intelligently) subtract equations to generate additional constraints
+    # This helps avoid putting all delay in a single shared variable
+    if derive_lim:
+        dstart = len(b)
+
+        # Original simple
+        if 0:
+            for di in range(derive_lim):
+                print
+                assert len(Ads) == len(b)
+                n_orig = len(b)
+
+                # Meat of the operation
+                # Focus on easy equations for first pass to get a lot of easy derrivations
+                col_lim = 12 if di == 0 else None
+                #col_lim = None
+                Ads, b = derive_eq_by_row(Ads, b, col_lim=col_lim)
+                debug("der_rows")
+                # Run another simplify pass since new equations may have overlap with original
+                Ads, b = simplify_rows(Ads, b)
+                print('Derive row %d / %d: %d => %d equations' % (di + 1, derive_lim, n_orig, len(b)))
+                debug("der_rows simp")
+
+                n_orig2 = len(b)
+                # Meat of the operation
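+                # derive_eq_by_col substitutes each solved single-variable row
+                # (e.g. t2 >= 7) into the longer rows, eliminating that column
+                # from them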
+ Ads, b = derive_eq_by_col(Ads, b) + debug("der_cols") + # Run another simplify pass since new equations may have overlap with original + Ads, b = simplify_rows(Ads, b) + print('Derive col %d / %d: %d => %d equations' % (di + 1, derive_lim, n_orig2, len(b))) + debug("der_cols simp") + + if n_orig == len(b): + break + + if 1: + # Each iteration one more column is allowed until all columns are included + # (and the system is stable) + col_lim = 15 + di = 0 + while True: + print + n_orig = len(b) + + print('Loop %d, lim %d' % (di + 1, col_lim)) + # Meat of the operation + Ads, b = derive_eq_by_row(Ads, b, col_lim=col_lim, tweak=True) + debug("der_rows") + # Run another simplify pass since new equations may have overlap with original + Ads, b = simplify_rows(Ads, b) + print('Derive row: %d => %d equations' % (n_orig, len(b))) + debug("der_rows simp") + + n_orig2 = len(b) + # Meat of the operation + Ads, b = derive_eq_by_col(Ads, b) + debug("der_cols") + # Run another simplify pass since new equations may have overlap with original + Ads, b = simplify_rows(Ads, b) + print('Derive col %d: %d => %d equations' % (di + 1, n_orig2, len(b))) + debug("der_cols simp") + + # Doesn't help computation, but helps debugging + Ads, b = sort_equations(Ads, b) + debug("loop done") + col_dist(Ads, 'derive done iter %d, lim %d' % (di, col_lim), lim=12) + + rows = len(Ads) + if n_orig == len(b) and col_lim >= rows: + break + col_lim += col_lim / 5 + di += 1 + + dend = len(b) + print('') + print('Derive net: %d => %d' % (dstart, dend)) + print('') + # Was experimentting to see how much the higher order columns really help + + ''' + cols_min_post = opts.get('cols_min_post', None) + cols_max_post = opts.get('cols_max_post', None) + # Filter input based on number of columns + if cols_min_post or cols_max_post: + Ads, b = filter_ncols(Ads=Ads, b=b, cols_min=cols_min_post, cols_max=cols_max_post) + debug("filter_ncals final") + ''' + + # Helps debug readability + Ads, b = sort_equations(Ads, b) + debug("final (sorted)") + return Ads, b + diff --git a/experiments/timfuz/timfuz_rref.py b/experiments/timfuz/timfuz_rref.py index 0ac87967..31ecca0d 100644 --- a/experiments/timfuz/timfuz_rref.py +++ b/experiments/timfuz/timfuz_rref.py @@ -169,7 +169,7 @@ def comb_corr_sets(state, verbose=False): continue # a grouping - group_name = "GROUP_%u" % row_i + group_name = "GRP_%u" % row_i rowdsf = row_sym2dsf(rowsym, names) state.subs[group_name] = rowdsf diff --git a/experiments/timfuz/timfuz_solve.py b/experiments/timfuz/timfuz_solve.py index 2041d773..356476e5 100644 --- a/experiments/timfuz/timfuz_solve.py +++ b/experiments/timfuz/timfuz_solve.py @@ -2,7 +2,8 @@ # https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html from scipy.optimize import linprog -from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json +from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json, A_ub_np2d, print_eqns, print_eqns_np +from timfuz_massage import massage_equations import numpy as np import glob import json @@ -65,12 +66,10 @@ def check_feasible(A_ub, b_ub): print(' done') def run_corner(Anp, b, names, verbose=False, opts={}, meta={}): + # Given timing scores for above delays (-ps) assert type(Anp[0]) is np.ndarray, type(Anp[0]) assert type(b) is np.ndarray, type(b) - # Given timing scores for above delays (-ps) - names_orig = names - 
#check_feasible(Anp, b) ''' @@ -91,6 +90,12 @@ def run_corner(Anp, b, names, verbose=False, opts={}, meta={}): #A_ub = -1.0 * Anp A_ub = [-1.0 * x for x in Anp] + if verbose: + print('') + print('A_ub b_ub') + print_eqns_np(A_ub, b_ub, verbose=verbose) + print('') + print('Creating misc constants...') # Minimization function scalars # Treat all logic elements as equally important @@ -133,7 +138,7 @@ def run_corner(Anp, b, names, verbose=False, opts={}, meta={}): print('') # Now find smallest values for delay constants # Due to input bounds (ex: column limit), some delay elements may get eliminated entirely - print('Running linprog w/ %d r, %d c (%d name)' % (rows, cols, len(names_orig))) + print('Running linprog w/ %d r, %d c (%d name)' % (rows, cols, len(names))) res = linprog(c, A_ub=A_ub, b_ub=b_ub, bounds=bounds, callback=callback, options={"disp": True, 'maxiter': maxiter, 'bland': True, 'tol': 1e-6,}) nonzeros = 0 @@ -155,7 +160,7 @@ def run_corner(Anp, b, names, verbose=False, opts={}, meta={}): print('Writing %s' % fn_out) np.save(fn_out, (3, c, A_ub, b_ub, bounds, names, res, meta)) -def run(fns_in, corner, sub_json=None, dedup=True, verbose=False): +def run(fns_in, corner, sub_json=None, dedup=True, massage=False, verbose=False): Ads, b = loadc_Ads_b(fns_in, corner, ico=True) # Remove duplicate rows @@ -175,12 +180,15 @@ def run(fns_in, corner, sub_json=None, dedup=True, verbose=False): else: names = index_names(Ads) - if 0: + if verbose: print - print_eqns(A_ubd, b_ub, verbose=verbose) + print_eqns(Ads, b, verbose=verbose) - print - col_dist(A_ubd, 'final', names) + #print + #col_dist(A_ubd, 'final', names) + + if massage: + Ads, b = massage_equations(Ads, b) print('Converting to numpy...') names, Anp = A_ds2np(Ads) @@ -195,6 +203,7 @@ def main(): ) parser.add_argument('--verbose', action='store_true', help='') + parser.add_argument('--massage', action='store_true', help='') parser.add_argument('--sub-json', help='Group substitutions to make fully ranked') parser.add_argument('--corner', default="slow_max", help='') parser.add_argument( @@ -215,7 +224,7 @@ def main(): try: run(sub_json=sub_json, - fns_in=fns_in, verbose=args.verbose, corner=args.corner) + fns_in=fns_in, verbose=args.verbose, corner=args.corner, massage=args.massage) finally: print('Exiting after %s' % bench) From 6d78626239b209b9bcdbc2404c3813b36e9f4fe2 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Fri, 24 Aug 2018 17:09:50 -0700 Subject: [PATCH 07/55] timfuz: massage experiments Signed-off-by: John McMaster --- experiments/timfuz/timfuz_massage.py | 340 +++++++++++++++++++++------ experiments/timfuz/timfuz_rref.py | 35 +-- 2 files changed, 279 insertions(+), 96 deletions(-) diff --git a/experiments/timfuz/timfuz_massage.py b/experiments/timfuz/timfuz_massage.py index add24fe1..3c7b78b8 100644 --- a/experiments/timfuz/timfuz_massage.py +++ b/experiments/timfuz/timfuz_massage.py @@ -1,6 +1,6 @@ #!/usr/bin/env python3 -from timfuz import simplify_rows, print_eqns, print_eqns_np, sort_equations, col_dist +from timfuz import simplify_rows, print_eqns, print_eqns_np, sort_equations, col_dist, index_names import numpy as np import math import sys @@ -92,9 +92,9 @@ def derive_eq_by_row(Ads, b, verbose=0, col_lim=0, tweak=False): ltes = 0 scs = 0 b_ret = list(b) - sys.stdout.write('Deriving rows ') + sys.stdout.write('Deriving rows (%u) ' % rows) sys.stdout.flush() - progress = max(1, rows / 100) + progress = int(max(1, rows / 100)) for row_refi, row_ref in enumerate(Ads): if row_refi % progress == 0: 
sys.stdout.write('.') @@ -152,6 +152,104 @@ def derive_eq_by_row(Ads, b, verbose=0, col_lim=0, tweak=False): assert len(Ads_ret) == len(b_ret) return Ads_ret, b_ret +def derive_eq_by_near_row(Ads, b, verbose=0, col_lim=0, tweak=False): + ''' + Derive equations by subtracting whole rows + + Given equations like: + t0 >= 10 + t0 + t1 >= 15 + t0 + t1 + t2 >= 17 + + When I look at these, I think of a solution something like: + t0 = 10f + t1 = 5 + t2 = 2 + + However, linprog tends to choose solutions like: + t0 = 17 + t1 = 0 + t2 = 0 + + To this end, add additional constraints by finding equations that are subsets of other equations + How to do this in a reasonable time span? + Also equations are sparse, which makes this harder to compute + ''' + rows = len(Ads) + assert rows == len(b) + rowdelta = int(rows / 2) + + # Index equations into hash maps so can lookup sparse elements quicker + assert len(Ads) == len(b) + Ads_ret = copy.copy(Ads) + assert len(Ads) == len(Ads_ret) + + #print('Finding subsets') + ltes = 0 + scs = 0 + b_ret = list(b) + sys.stdout.write('Deriving rows (%u) ' % rows) + sys.stdout.flush() + progress = int(max(1, rows / 100)) + for row_refi, row_ref in enumerate(Ads): + if row_refi % progress == 0: + sys.stdout.write('.') + sys.stdout.flush() + if col_lim and len(row_ref) > col_lim: + continue + + #for row_cmpi, row_cmp in enumerate(Ads): + for row_cmpi in range(max(0, row_refi - rowdelta), min(len(Ads), row_refi + rowdelta)): + if row_refi == row_cmpi or col_lim and len(row_cmp) > col_lim: + continue + row_cmp = Ads[row_cmpi] + # FIXME: this check was supposed to be removed + ''' + Every elements in row_cmp is in row_ref + but this doesn't mean the constants are smaller + Filter these out + ''' + # XXX: just reduce and filter out solutions with positive constants + # or actually are these also useful as is? + lte = lte_const(row_ref, row_cmp) + if lte: + ltes += 1 + sc = 0 and shared_const(row_ref, row_cmp) + if sc: + scs += 1 + if lte or sc: + if verbose: + print('') + print('match') + print(' ', row_ref, b[row_refi]) + print(' ', row_cmp, b[row_cmpi]) + # Reduce + A_new = reduce_const(row_ref, row_cmp) + # Did this actually significantly reduce the search space? + #if tweak and len(A_new) > 4 and len(A_new) > len(row_cmp) / 2: + #if tweak and len(A_new) > 8 and len(A_new) > len(row_cmp) / 2: + # continue + b_new = b[row_refi] - b[row_cmpi] + # Definitely possible + # Maybe filter these out if they occur? 
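+                # as in derive_eq_by_row: a non-positive b_new means the
+                # compared row carried at least as much delay, so the pair
+                # derives nothing useful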
+ if verbose: + print(b_new) + # Also inverted sign + if b_new <= 0: + if verbose: + print("Unexpected b") + continue + if verbose: + print('OK') + Ads_ret.append(A_new) + b_ret.append(b_new) + print(' done') + + #A_ub_ret = A_di2np(Ads2, cols=cols) + print('Derive row: %d => %d rows using %d lte, %d sc' % (len(b), len(b_ret), ltes, scs)) + assert len(Ads_ret) == len(b_ret) + return Ads_ret, b_ret + def derive_eq_by_col(Ads, b_ub, verbose=0): ''' Derive equations by subtracting out all bounded constants (ie "known" columns) @@ -224,7 +322,7 @@ def derive_eq_by_col(Ads, b_ub, verbose=0): print('Derive col: %d => %d rows' % (len(b_ub), len(b_ret))) return Ads_ret, b_ret -def massage_equations(Ads, b, verbose=False, derive_lim=3): +def massage_equations_old(Ads, b, verbose=False, derive_lim=3): ''' Equation pipeline Some operations may generate new equations @@ -242,82 +340,43 @@ def massage_equations(Ads, b, verbose=False, derive_lim=3): # Try to (intelligently) subtract equations to generate additional constraints # This helps avoid putting all delay in a single shared variable - if derive_lim: - dstart = len(b) + dstart = len(b) - # Original simple - if 0: - for di in range(derive_lim): - print - assert len(Ads) == len(b) - n_orig = len(b) + # Original simple + for di in range(derive_lim): + print + assert len(Ads) == len(b) + n_orig = len(b) - # Meat of the operation - # Focus on easy equations for first pass to get a lot of easy derrivations - col_lim = 12 if di == 0 else None - #col_lim = None - Ads, b = derive_eq_by_row(Ads, b, col_lim=col_lim) - debug("der_rows") - # Run another simplify pass since new equations may have overlap with original - Ads, b = simplify_rows(Ads, b) - print('Derive row %d / %d: %d => %d equations' % (di + 1, derive_lim, n_orig, len(b))) - debug("der_rows simp") + # Meat of the operation + # Focus on easy equations for first pass to get a lot of easy derrivations + col_lim = 12 if di == 0 else None + #col_lim = None + Ads, b = derive_eq_by_row(Ads, b, col_lim=col_lim) + debug("der_rows") + # Run another simplify pass since new equations may have overlap with original + Ads, b = simplify_rows(Ads, b) + print('Derive row %d / %d: %d => %d equations' % (di + 1, derive_lim, n_orig, len(b))) + debug("der_rows simp") - n_orig2 = len(b) - # Meat of the operation - Ads, b = derive_eq_by_col(Ads, b) - debug("der_cols") - # Run another simplify pass since new equations may have overlap with original - Ads, b = simplify_rows(Ads, b) - print('Derive col %d / %d: %d => %d equations' % (di + 1, derive_lim, n_orig2, len(b))) - debug("der_cols simp") + n_orig2 = len(b) + # Meat of the operation + Ads, b = derive_eq_by_col(Ads, b) + debug("der_cols") + # Run another simplify pass since new equations may have overlap with original + Ads, b = simplify_rows(Ads, b) + print('Derive col %d / %d: %d => %d equations' % (di + 1, derive_lim, n_orig2, len(b))) + debug("der_cols simp") - if n_orig == len(b): - break + if n_orig == len(b): + break - if 1: - # Each iteration one more column is allowed until all columns are included - # (and the system is stable) - col_lim = 15 - di = 0 - while True: - print - n_orig = len(b) - print('Loop %d, lim %d' % (di + 1, col_lim)) - # Meat of the operation - Ads, b = derive_eq_by_row(Ads, b, col_lim=col_lim, tweak=True) - debug("der_rows") - # Run another simplify pass since new equations may have overlap with original - Ads, b = simplify_rows(Ads, b) - print('Derive row: %d => %d equations' % (n_orig, len(b))) - debug("der_rows simp") - - n_orig2 = 
len(b) - # Meat of the operation - Ads, b = derive_eq_by_col(Ads, b) - debug("der_cols") - # Run another simplify pass since new equations may have overlap with original - Ads, b = simplify_rows(Ads, b) - print('Derive col %d: %d => %d equations' % (di + 1, n_orig2, len(b))) - debug("der_cols simp") - - # Doesn't help computation, but helps debugging - Ads, b = sort_equations(Ads, b) - debug("loop done") - col_dist(Ads, 'derive done iter %d, lim %d' % (di, col_lim), lim=12) - - rows = len(Ads) - if n_orig == len(b) and col_lim >= rows: - break - col_lim += col_lim / 5 - di += 1 - - dend = len(b) - print('') - print('Derive net: %d => %d' % (dstart, dend)) - print('') - # Was experimentting to see how much the higher order columns really help + dend = len(b) + print('') + print('Derive net: %d => %d' % (dstart, dend)) + print('') + # Was experimentting to see how much the higher order columns really help ''' cols_min_post = opts.get('cols_min_post', None) @@ -333,3 +392,136 @@ def massage_equations(Ads, b, verbose=False, derive_lim=3): debug("final (sorted)") return Ads, b +def massage_equations_old2(Ads, b, verbose=False): + ''' + Equation pipeline + Some operations may generate new equations + Simplify after these to avoid unnecessary overhead on redundant constraints + Similarly some operations may eliminate equations, potentially eliminating a column (ie variable) + Remove these columns as necessary to speed up solving + ''' + + def debug(what): + if verbose: + print('') + print_eqns(Ads, b, verbose=verbose, label=what, lim=20) + col_dist(Ads, what) + check_feasible_d(Ads, b) + + # Try to (intelligently) subtract equations to generate additional constraints + # This helps avoid putting all delay in a single shared variable + dstart = len(b) + cols = len(index_names(Ads)) + + # Each iteration one more column is allowed until all columns are included + # (and the system is stable) + col_lim = 15 + di = 0 + while True: + print + n_orig = len(b) + + print('Loop %d, lim %d' % (di + 1, col_lim)) + # Meat of the operation + Ads, b = derive_eq_by_row(Ads, b, col_lim=col_lim, tweak=True) + debug("der_rows") + # Run another simplify pass since new equations may have overlap with original + Ads, b = simplify_rows(Ads, b) + print('Derive row: %d => %d equations' % (n_orig, len(b))) + debug("der_rows simp") + + n_orig2 = len(b) + # Meat of the operation + Ads, b = derive_eq_by_col(Ads, b) + debug("der_cols") + # Run another simplify pass since new equations may have overlap with original + Ads, b = simplify_rows(Ads, b) + print('Derive col %d: %d => %d equations' % (di + 1, n_orig2, len(b))) + debug("der_cols simp") + + # Doesn't help computation, but helps debugging + Ads, b = sort_equations(Ads, b) + debug("loop done") + col_dist(Ads, 'derive done iter %d, lim %d' % (di, col_lim), lim=12) + + rows = len(Ads) + if n_orig == len(b) and col_lim >= cols: + break + col_lim += col_lim / 5 + di += 1 + + dend = len(b) + print('') + print('Derive net: %d => %d' % (dstart, dend)) + print('') + # Was experimentting to see how much the higher order columns really help + + # Helps debug readability + Ads, b = sort_equations(Ads, b) + debug("final (sorted)") + print('') + print('Massage final: %d => %d rows' % (dstart, dend)) + return Ads, b + +def massage_equations(Ads, b, verbose=False): + ''' + Equation pipeline + Some operations may generate new equations + Simplify after these to avoid unnecessary overhead on redundant constraints + Similarly some operations may eliminate equations, potentially eliminating 
a column (ie variable) + Remove these columns as necessary to speed up solving + ''' + + def debug(what): + if verbose: + print('') + print_eqns(Ads, b, verbose=verbose, label=what, lim=20) + col_dist(Ads, what) + check_feasible_d(Ads, b) + + # Try to (intelligently) subtract equations to generate additional constraints + # This helps avoid putting all delay in a single shared variable + dstart = len(b) + cols = len(index_names(Ads)) + + # Each iteration one more column is allowed until all columns are included + # (and the system is stable) + print + n_orig = len(b) + + # Meat of the operation + Ads, b = derive_eq_by_near_row(Ads, b, tweak=True) + debug("der_rows") + # Run another simplify pass since new equations may have overlap with original + Ads, b = simplify_rows(Ads, b) + print('Derive row: %d => %d equations' % (n_orig, len(b))) + debug("der_rows simp") + + n_orig2 = len(b) + # Meat of the operation + Ads, b = derive_eq_by_col(Ads, b) + debug("der_cols") + # Run another simplify pass since new equations may have overlap with original + Ads, b = simplify_rows(Ads, b) + print('Derive col: %d => %d equations' % (n_orig2, len(b))) + debug("der_cols simp") + + # Doesn't help computation, but helps debugging + Ads, b = sort_equations(Ads, b) + debug("loop done") + col_dist(Ads, 'derive done', lim=12) + + rows = len(Ads) + + dend = len(b) + print('') + print('Derive net: %d => %d' % (dstart, dend)) + print('') + # Was experimentting to see how much the higher order columns really help + + # Helps debug readability + Ads, b = sort_equations(Ads, b) + debug("final (sorted)") + print('') + print('Massage final: %d => %d rows' % (dstart, dend)) + return Ads, b diff --git a/experiments/timfuz/timfuz_rref.py b/experiments/timfuz/timfuz_rref.py index 31ecca0d..85122d54 100644 --- a/experiments/timfuz/timfuz_rref.py +++ b/experiments/timfuz/timfuz_rref.py @@ -5,7 +5,7 @@ Triaging tool to help understand where we need more timing coverage Finds correlated variables to help make better test cases ''' -from timfuz import Benchmark, Ar_di2np, loadc_Ads_b, index_names, A_ds2np +from timfuz import Benchmark, Ar_di2np, loadc_Ads_b, index_names, A_ds2np, simplify_rows import numpy as np import glob import math @@ -57,7 +57,9 @@ class State(object): @staticmethod def load(fn_ins): - Ads, _b = loadc_Ads_b(fn_ins, corner=None, ico=True) + Ads, b = loadc_Ads_b(fn_ins, corner=None, ico=True) + print('Simplifying') + #Ads, b = simplify_rows(Ads, b) return State(Ads) def write_state(state, fout): @@ -70,18 +72,6 @@ def write_state(state, fout): } json.dump(j, fout, sort_keys=True, indent=4, separators=(',', ': ')) -def Adi2matrix(Adi, cols): - A_ub2 = [np.zeros(cols) for _i in range(cols)] - - dst_rowi = 0 - for row in Adi: - rownp = Ar_di2np(row, cols=len(names), sf=1) - - A_ub2[dst_rowi] = np.add(A_ub2[dst_rowi], rownp) - dst_rowi = (dst_rowi + 1) % len(names) - - return A_ub2 - def Anp2matrix(Anp): ''' Original idea was to make into a square matrix @@ -119,27 +109,28 @@ def row_sym2dsf(rowsym, names): ret[name] = (int(num), int(den)) return ret -def comb_corr_sets(state, verbose=False): +def state_rref(state, verbose=False): print('Converting rows to integer keys') names, Anp = A_ds2np(state.Ads) print('np: %u rows x %u cols' % (len(Anp), len(Anp[0]))) print('Combining rows into matrix') - mnp = Anp2matrix(Anp) + #mnp = Anp2matrix(Anp) + mnp = Anp print('Matrix: %u rows x %u cols' % (len(mnp), len(mnp[0]))) print('Converting np to sympy matrix') mfrac = fracm(mnp) - print('mfrac', type(mfrac[0][0])) msym = 
sympy.Matrix(mfrac) - print('Making rref') - rref, pivots = msym.rref() - - if verbose: print('names') print(names) print('Matrix') sympy.pprint(msym) + print('Making rref') + rref, pivots = msym.rref() + + + if verbose: print('Pivots') sympy.pprint(pivots) print('rref') @@ -189,7 +180,7 @@ def run(fout, fn_ins, verbose=0): print('Loading data') state = State.load(fn_ins) - comb_corr_sets(state, verbose=verbose) + state_rref(state, verbose=verbose) state.print_stats() if fout: write_state(state, fout) From 9ff07f4278e9bd98252f4c6b98878b8f43c52564 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Mon, 27 Aug 2018 12:37:21 -0700 Subject: [PATCH 08/55] timfuz: matrix perf test Signed-off-by: John McMaster --- experiments/timfuz/timfuz_perf.py | 99 +++++++++++++++++++++++++++++++ 1 file changed, 99 insertions(+) create mode 100644 experiments/timfuz/timfuz_perf.py diff --git a/experiments/timfuz/timfuz_perf.py b/experiments/timfuz/timfuz_perf.py new file mode 100644 index 00000000..4246f034 --- /dev/null +++ b/experiments/timfuz/timfuz_perf.py @@ -0,0 +1,99 @@ +#!/usr/bin/env python3 + +''' +Triaging tool to help understand where we need more timing coverage +Finds correlated variables to help make better test cases +''' + +from timfuz import Benchmark, Ar_di2np, loadc_Ads_b, index_names, A_ds2np, simplify_rows +import numpy as np +import glob +import math +import json +import sympy +from collections import OrderedDict +from fractions import Fraction +import random + +def fracr(r): + DELTA = 0.0001 + + for i, x in enumerate(r): + if type(x) is float: + xi = int(x) + assert abs(xi - x) < DELTA + r[i] = xi + return [Fraction(x) for x in r] + +def fracm(m): + return [fracr(r) for r in m] + +def create_matrix(rows, cols): + ret = np.zeros((rows, cols)) + for rowi in range(rows): + for coli in range(cols): + ret[rowi][coli] = random.randint(1, 10) + return ret + +def create_matrix_sparse(rows, cols): + ret = np.zeros((rows, cols)) + for rowi in range(rows): + for coli in range(cols): + if random.randint(0, 5) < 1: + ret[rowi][coli] = random.randint(1, 10) + return ret + +def run(rows=35, cols=200, verbose=False, encoding='np', sparse=False): + random.seed(0) + if sparse: + mnp = create_matrix_sparse(rows, cols) + else: + mnp = create_matrix(rows, cols) + #print(mnp[0]) + + if encoding == 'fraction': + mfrac = fracm(mnp) + msym = sympy.Matrix(mfrac) + elif encoding == 'np': + msym = sympy.Matrix(mnp) + else: + assert 0, 'bad encoding: %s' % encoding + + if verbose: + print('names') + print(names) + print('Matrix') + sympy.pprint(msym) + + print('%s matrix, %u rows x %u cols, sparse: %s' % (encoding, len(mnp), len(mnp[0]), sparse)) + bench = Benchmark() + try: + rref, pivots = msym.rref() + finally: + print('rref exiting after %s' % bench) + + if verbose: + print('Pivots') + sympy.pprint(pivots) + print('rref') + sympy.pprint(rref) + +def main(): + import argparse + + parser = argparse.ArgumentParser( + description= + 'Timing fuzzer' + ) + + parser.add_argument('--verbose', action='store_true', help='') + parser.add_argument('--sparse', action='store_true', help='') + parser.add_argument('--rows', type=int, help='') + parser.add_argument('--cols', type=int, help='') + parser.add_argument('--encoding', default='np', help='') + args = parser.parse_args() + + run(encoding=args.encoding, rows=args.rows, cols=args.cols, sparse=args.sparse, verbose=args.verbose) + +if __name__ == '__main__': + main() From b4874d2cf936f80f2f1e95cf65d853ce10fbb5cc Mon Sep 17 00:00:00 2001 From: John McMaster Date: Mon, 27 
Aug 2018 13:07:30 -0700 Subject: [PATCH 09/55] timfuz: perf tests Signed-off-by: John McMaster --- experiments/timfuz/timfuz_perf.py | 36 +++++++++++++++++++++++++------ 1 file changed, 29 insertions(+), 7 deletions(-) diff --git a/experiments/timfuz/timfuz_perf.py b/experiments/timfuz/timfuz_perf.py index 4246f034..df1998a8 100644 --- a/experiments/timfuz/timfuz_perf.py +++ b/experiments/timfuz/timfuz_perf.py @@ -14,8 +14,9 @@ import sympy from collections import OrderedDict from fractions import Fraction import random +from sympy import Rational -def fracr(r): +def intr(r): DELTA = 0.0001 for i, x in enumerate(r): @@ -23,11 +24,25 @@ def fracr(r): xi = int(x) assert abs(xi - x) < DELTA r[i] = xi + +def fracr(r): + intr(r) return [Fraction(x) for x in r] def fracm(m): return [fracr(r) for r in m] +def symratr(r): + intr(r) + return [Rational(x) for x in r] + +def symratm(m): + return [symratr(r) for r in m] + +def intm(m): + [intr(r) for r in m] + return m + def create_matrix(rows, cols): ret = np.zeros((rows, cols)) for rowi in range(rows): @@ -43,7 +58,7 @@ def create_matrix_sparse(rows, cols): ret[rowi][coli] = random.randint(1, 10) return ret -def run(rows=35, cols=200, verbose=False, encoding='np', sparse=False): +def run(rows=35, cols=200, verbose=False, encoding='np', sparse=False, normalize_last=True): random.seed(0) if sparse: mnp = create_matrix_sparse(rows, cols) @@ -52,12 +67,17 @@ def run(rows=35, cols=200, verbose=False, encoding='np', sparse=False): #print(mnp[0]) if encoding == 'fraction': - mfrac = fracm(mnp) - msym = sympy.Matrix(mfrac) + msym = sympy.Matrix(fracm(mnp)) elif encoding == 'np': msym = sympy.Matrix(mnp) + elif encoding == 'sympy': + msym = sympy.Matrix(symratm(mnp)) + # this actually produces float results + elif encoding == 'int': + msym = sympy.Matrix(intm(mnp)) else: assert 0, 'bad encoding: %s' % encoding + print(type(msym[0]), str(msym[0])) if verbose: print('names') @@ -65,12 +85,13 @@ def run(rows=35, cols=200, verbose=False, encoding='np', sparse=False): print('Matrix') sympy.pprint(msym) - print('%s matrix, %u rows x %u cols, sparse: %s' % (encoding, len(mnp), len(mnp[0]), sparse)) + print('%s matrix, %u rows x %u cols, sparse: %s, normlast: %s' % (encoding, len(mnp), len(mnp[0]), sparse, normalize_last)) bench = Benchmark() try: - rref, pivots = msym.rref() + rref, pivots = msym.rref(normalize_last=normalize_last) finally: print('rref exiting after %s' % bench) + print(type(rref[0]), str(rref[0])) if verbose: print('Pivots') @@ -90,10 +111,11 @@ def main(): parser.add_argument('--sparse', action='store_true', help='') parser.add_argument('--rows', type=int, help='') parser.add_argument('--cols', type=int, help='') + parser.add_argument('--normalize-last', type=int, help='') parser.add_argument('--encoding', default='np', help='') args = parser.parse_args() - run(encoding=args.encoding, rows=args.rows, cols=args.cols, sparse=args.sparse, verbose=args.verbose) + run(encoding=args.encoding, rows=args.rows, cols=args.cols, sparse=args.sparse, normalize_last=bool(args.normalize_last), verbose=args.verbose) if __name__ == '__main__': main() From 4d15c15267a18f56d2c9a985fcfcee4703890304 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Mon, 27 Aug 2018 13:16:13 -0700 Subject: [PATCH 10/55] timfuz: normalize_last=False Signed-off-by: John McMaster --- experiments/timfuz/timfuz_rref.py | 7 ++++++- 1 file changed, 6 insertions(+), 1 deletion(-) diff --git a/experiments/timfuz/timfuz_rref.py b/experiments/timfuz/timfuz_rref.py index 85122d54..59016891 
100644
--- a/experiments/timfuz/timfuz_rref.py
+++ b/experiments/timfuz/timfuz_rref.py
@@ -53,6 +53,7 @@ class State(object):
         print("  Cols (preprocessed): %u" % len(self.base_names))
         print("  Drop names: %u" % len(self.drop_names))
         print("  Cols (out): %u" % len(self.names))
+        print("  Solvable vars: %u" % len(self.names & self.base_names))
         assert len(self.names) >= len(self.subs)
 
     @staticmethod
@@ -121,13 +122,17 @@ def state_rref(state, verbose=False):
     print('Converting np to sympy matrix')
     mfrac = fracm(mnp)
     msym = sympy.Matrix(mfrac)
+    # internal encoding has significant performance implications
+    #print(type(msym[3]))
+    #assert type(msym[0]) is sympy.Integer
+
     if verbose:
         print('names')
         print(names)
         print('Matrix')
         sympy.pprint(msym)
 
     print('Making rref')
-    rref, pivots = msym.rref()
+    rref, pivots = msym.rref(normalize_last=False)
 
     if verbose:

From 42eccf21004fad94132becf66a68aceed66d20f1 Mon Sep 17 00:00:00 2001
From: John McMaster
Date: Mon, 27 Aug 2018 14:51:41 -0700
Subject: [PATCH 11/55] timfuz: quicker matrix loading

Signed-off-by: John McMaster
---
 experiments/timfuz/timfuz.py      |  2 +-
 experiments/timfuz/timfuz_rref.py | 37 ++++++++++++++++++++++---------
 2 files changed, 27 insertions(+), 12 deletions(-)

diff --git a/experiments/timfuz/timfuz.py b/experiments/timfuz/timfuz.py
index f0b4af9f..01727a4b 100644
--- a/experiments/timfuz/timfuz.py
+++ b/experiments/timfuz/timfuz.py
@@ -138,7 +138,7 @@ def simplify_rows(Ads, b_ub):
     sys.stdout.write('SimpR ')
     sys.stdout.flush()
 
-    progress = max(1, len(b_ub) / 100)
+    progress = int(max(1, len(b_ub) / 100))
     zero_ds = 0
     zero_es = 0
     for loopi, (b, rowd) in enumerate(zip(b_ub, Ads)):

diff --git a/experiments/timfuz/timfuz_rref.py b/experiments/timfuz/timfuz_rref.py
index 59016891..74771edd 100644
--- a/experiments/timfuz/timfuz_rref.py
+++ b/experiments/timfuz/timfuz_rref.py
@@ -27,6 +27,16 @@ def fracr(r):
 def fracm(m):
     return [fracr(r) for r in m]
 
+def fracr_quick(r):
+    return [Fraction(numerator=int(x), denominator=1) for x in r]
+
+# the way I'm doing things they should all be even integers
+# hmm this was only slightly faster
+def fracm_quick(m):
+    t = type(m[0][0])
+    print('fracm_quick type: %s' % t)
+    return [fracr_quick(r) for r in m]
+
 class State(object):
     def __init__(self, Ads, drop_names=[]):
         self.Ads = Ads
@@ -57,10 +67,11 @@ class State(object):
         assert len(self.names) >= len(self.subs)
 
     @staticmethod
-    def load(fn_ins):
-        Ads, b = loadc_Ads_b(fn_ins, corner=None, ico=True)
-        print('Simplifying')
-        #Ads, b = simplify_rows(Ads, b)
+    def load(fn_ins, simplify=False, corner=None):
+        Ads, b = loadc_Ads_b(fn_ins, corner=corner, ico=True)
+        if simplify:
+            print('Simplifying corner %s' % (corner,))
+            Ads, b = simplify_rows(Ads, b)
         return State(Ads)
 
 def write_state(state, fout):
@@ -115,12 +126,14 @@ def state_rref(state, verbose=False):
     names, Anp = A_ds2np(state.Ads)
     print('np: %u rows x %u cols' % (len(Anp), len(Anp[0])))
 
-    print('Combining rows into matrix')
-    #mnp = Anp2matrix(Anp)
-    mnp = Anp
+    if 0:
+        print('Combining rows into matrix')
+        mnp = Anp2matrix(Anp)
+    else:
+        mnp = Anp
     print('Matrix: %u rows x %u cols' % (len(mnp), len(mnp[0])))
     print('Converting np to sympy matrix')
-    mfrac = fracm(mnp)
+    mfrac = fracm_quick(mnp)
     msym = sympy.Matrix(mfrac)
     # internal encoding has significant performance implications
     #print(type(msym[3]))
     #assert type(msym[0]) is sympy.Integer
@@ -181,10 +194,10 @@ def state_rref(state, verbose=False):
 
     return state
 
-def run(fout, fn_ins, verbose=0):
+def run(fout, fn_ins, simplify=False, corner=None, verbose=0):
 
     print('Loading data')
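An aside on the fracm_quick shortcut above: Fraction(float) has to decompose the float bit pattern into an exact ratio, while Fraction(int, 1) goes straight to an integer rational, and since the loaded coefficients are whole numbers anyway the int path is safe. A throwaway micro-benchmark sketch of the comparison (standalone illustration; the data is made up and, per the comment above, the win is only slight):

    import timeit
    from fractions import Fraction

    # whole-valued floats, like the loaded coefficient matrix
    row = [float(i % 7) for i in range(1000)]
    via_float = timeit.timeit(lambda: [Fraction(x) for x in row], number=100)
    via_int = timeit.timeit(lambda: [Fraction(int(x), 1) for x in row], number=100)
    print('Fraction(float): %.3fs  Fraction(int, 1): %.3fs' % (via_float, via_int))

-    state = 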
State.load(fn_ins)
+    state = State.load(fn_ins, simplify=simplify, corner=corner)
     state_rref(state, verbose=verbose)
     state.print_stats()
     if fout:
@@ -199,6 +212,8 @@ def main():
     )
 
     parser.add_argument('--verbose', action='store_true', help='')
+    parser.add_argument('--simplify', action='store_true', help='')
+    parser.add_argument('--corner', default="slow_max", help='')
     parser.add_argument('--speed-json', default='build_speed/speed.json',
        help='Provides speed index to name translation')
     parser.add_argument('--out', help='Output sub.json substitution result')
@@ -219,7 +234,7 @@ def main():
     try:
         run(fout=fout,
-            fn_ins=args.fns_in, verbose=args.verbose)
+            fn_ins=args.fns_in, simplify=args.simplify, corner=args.corner, verbose=args.verbose)
     finally:
         print('Exiting after %s' % bench)

From 632fbffc4b0a5f6ee610433d323eeebcf0cf1e0d Mon Sep 17 00:00:00 2001
From: John McMaster
Date: Mon, 27 Aug 2018 15:04:52 -0700
Subject: [PATCH 12/55] timfuz: don't open file until writing results

Signed-off-by: John McMaster
---
 experiments/timfuz/timfuz_rref.py | 16 +++++++---------
 1 file changed, 7 insertions(+), 9 deletions(-)

diff --git a/experiments/timfuz/timfuz_rref.py b/experiments/timfuz/timfuz_rref.py
index 74771edd..df0d7153 100644
--- a/experiments/timfuz/timfuz_rref.py
+++ b/experiments/timfuz/timfuz_rref.py
@@ -134,6 +134,8 @@ def state_rref(state, verbose=False):
     print('Matrix: %u rows x %u cols' % (len(mnp), len(mnp[0])))
     print('Converting np to sympy matrix')
     mfrac = fracm_quick(mnp)
+    # doesn't seem to change anything
+    #msym = sympy.MutableSparseMatrix(mfrac)
     msym = sympy.Matrix(mfrac)
     # internal encoding has significant performance implications
     #print(type(msym[3]))
@@ -147,7 +149,6 @@ def state_rref(state, verbose=False):
     print('Making rref')
     rref, pivots = msym.rref(normalize_last=False)
 
-
     if verbose:
         print('Pivots')
         sympy.pprint(pivots)
         print('rref')
@@ -194,14 +195,15 @@ def state_rref(state, verbose=False):
 
     return state
 
-def run(fout, fn_ins, simplify=False, corner=None, verbose=0):
+def run(fnout, fn_ins, simplify=False, corner=None, verbose=0):
 
     print('Loading data')
     state = State.load(fn_ins, simplify=simplify, corner=corner)
     state_rref(state, verbose=verbose)
     state.print_stats()
-    if fout:
-        write_state(state, fout)
+    if fnout:
+        with open(fnout, 'w') as fout:
+            write_state(state, fout)
 
 def main():
     import argparse
@@ -224,16 +226,12 @@ def main():
     args = parser.parse_args()
     bench = Benchmark()
 
-    fout = None
-    if args.out:
-        fout = open(args.out, 'w')
-
     fns_in = args.fns_in
     if not fns_in:
         fns_in = glob.glob('specimen_*/timing3.csv')
 
     try:
-        run(fout=fout,
+        run(fnout=args.out,
             fn_ins=args.fns_in, simplify=args.simplify, corner=args.corner, verbose=args.verbose)
     finally:
         print('Exiting after %s' % bench)

From d4d0af9d9fe4979e0c4891d02a7590f4b0645cd3 Mon Sep 17 00:00:00 2001
From: John McMaster
Date: Tue, 28 Aug 2018 13:43:35 -0700
Subject: [PATCH 13/55] timfuz: sub2csv

Signed-off-by: John McMaster
---
 experiments/timfuz/timfuz_sub2csv.py | 105 +++++++++++++++++++++++++++
 1 file changed, 105 insertions(+)
 create mode 100644 experiments/timfuz/timfuz_sub2csv.py

diff --git a/experiments/timfuz/timfuz_sub2csv.py b/experiments/timfuz/timfuz_sub2csv.py
new file mode 100644
index 00000000..9ea9bbbc
--- /dev/null
+++ b/experiments/timfuz/timfuz_sub2csv.py
@@ -0,0 +1,105 @@
+#!/usr/bin/env python3
+
+from timfuz import Benchmark, Ar_di2np, loadc_Ads_b, index_names, A_ds2np, simplify_rows
+import numpy as np
+import glob
+import math
+import json
+import sympy
+from collections import OrderedDict
+from fractions import Fraction
+
+def mlcm(xs):
+    '''
+    Find the LCM of the elements in a group
+    '''
+    l = xs[0]
+    for n in xs:
+        l = l * n // math.gcd(l, n)
+    return l
+
+def write_state(state, fout):
+    j = {
+        'names': dict([(x, None) for x in state.names]),
+        'drop_names': list(state.drop_names),
+        'base_names': list(state.base_names),
+        'subs': dict([(name, values) for name, values in state.subs.items()]),
+        'pivots': state.pivots,
+    }
+    json.dump(j, fout, sort_keys=True, indent=4, separators=(',', ': '))
+
+def gen_rows(fn_ins):
+    for fn_in in fn_ins:
+        try:
+            print('Loading %s' % fn_in)
+            j = json.load(open(fn_in, 'r'))
+
+            group0 = list(j['subs'].values())[0]
+            value0 = list(group0.values())[0]
+            if type(value0) is float:
+                print("WARNING: skipping old format JSON")
+                continue
+            else:
+                print("Value OK")
+
+            for sub in j['subs'].values():
+                row_ds = {}
+                # TODO: convert to gcd
+                # den may not always be 1
+                # lazy solution...just multiply out all the fractions
+                n = 1
+                for _var, (_num, den) in sub.items():
+                    n *= den
+
+                for var, (num, den) in sub.items():
+                    num2 = n * num
+                    assert num2 % den == 0
+                    row_ds[var] = num2 // den
+                yield row_ds
+        except:
+            print("Error processing %s" % fn_in)
+            raise
+
+def run(fnout, fn_ins, verbose=0):
+    print('Loading data')
+
+    with open(fnout, 'w') as fout:
+        fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n')
+        for row_ds in gen_rows(fn_ins):
+            ico = '1'
+            out_b = [1e9, 1e9, 1e9, 1e9]
+            items = [ico, ' '.join(['%u' % x for x in out_b])]
+
+            for k, v in sorted(row_ds.items()):
+                items.append('%i %s' % (v, k))
+            fout.write(','.join(items) + '\n')
+
+def main():
+    import argparse
+
+    parser = argparse.ArgumentParser(
+        description=
+        'Convert substitution groups into .csv to allow incremental rref results'
+    )
+
+    parser.add_argument('--verbose', action='store_true', help='')
+    parser.add_argument('--out', help='Output csv')
+    parser.add_argument(
+        'fns_in',
+        nargs='*',
+        help='sub.json input files')
+    args = parser.parse_args()
+    bench = Benchmark()
+
+    fns_in = args.fns_in
+
+    try:
+        run(fnout=args.out,
+            fn_ins=args.fns_in, verbose=args.verbose)
+    finally:
+        print('Exiting after %s' % bench)
+
+if __name__ == '__main__':
+    main()

From 41cf8469b540eb2e70d2ba156f2076c2711932b4 Mon Sep 17 00:00:00 2001
From: John McMaster
Date: Wed, 29 Aug 2018 13:13:46 -0700
Subject: [PATCH 14/55] timfuz: least square tests

Signed-off-by: John McMaster
---
 database/Makefile                           |  10 -
 database/Makefile.database                  |  15 -
 .../{timfuz_checksub.py => checksub.py}     |   0
 .../{timfuz_corner_csv.py => corner_csv.py} |   0
 .../timfuz/{timfuz_perf.py => perf_test.py} |   0
 experiments/timfuz/solve_leastsq.py         | 272 ++++++++++++++++++
 experiments/timfuz/solve_linprog.py         | 150 ++++++++++
 .../timfuz/{timfuz_sub2csv.py => sub2csv.py} |  0
 experiments/timfuz/timfuz.py                |  15 +-
 experiments/timfuz/timfuz_massage.py        |  10 +-
 experiments/timfuz/timfuz_solve.py          | 167 ++---------
 11 files changed, 470 insertions(+), 169 deletions(-)
 delete mode 100644 database/Makefile
 delete mode 100644 database/Makefile.database
 rename experiments/timfuz/{timfuz_checksub.py => checksub.py} (100%)
 rename experiments/timfuz/{timfuz_corner_csv.py => corner_csv.py} (100%)
 rename experiments/timfuz/{timfuz_perf.py => perf_test.py} (100%)
 create mode 100644 experiments/timfuz/solve_leastsq.py
 create mode 100644 experiments/timfuz/solve_linprog.py
 rename experiments/timfuz/{timfuz_sub2csv.py => sub2csv.py} (100%)
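On the 'TODO: convert to gcd' in gen_rows above: multiplying every denominator together scales the row far more than needed; the least common multiple of the denominators is the smallest factor that clears all the fractions. A sketch of that refinement (standalone illustration; clear_denominators is a hypothetical helper, but the {var: (num, den)} shape matches the sub groups above):

    import math

    def clear_denominators(sub):
        # sub: {var: (num, den)} with den > 0
        l = 1
        for _num, den in sub.values():
            l = l * den // math.gcd(l, den)
        # scale by the common denominator; every entry divides out exactly
        return {var: num * (l // den) for var, (num, den) in sub.items()}

    print(clear_denominators({'a': (1, 2), 'b': (3, 4)}))  # {'a': 2, 'b': 3}

diff --git a/database/Makefile b/database/Makefile
deleted file mode 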
100644 index 99fab407..00000000 --- a/database/Makefile +++ /dev/null @@ -1,10 +0,0 @@ -.NOTPARALLEL: - -SUBDIRS := $(patsubst %/,%, $(wildcard */)) - -.PHONY: $(SUBDIRS) - -$(MAKECMDGOALS): $(SUBDIRS) - -$(SUBDIRS): - $(MAKE) -C $@ -f ../Makefile.database $(MAKECMDGOALS) diff --git a/database/Makefile.database b/database/Makefile.database deleted file mode 100644 index 2e407968..00000000 --- a/database/Makefile.database +++ /dev/null @@ -1,15 +0,0 @@ -.PHONY: all clean - -all: tilegrid.json - -# Small dance to say that there is a single recipe that is run once to generate -# multiple files. -tileconn.json tilegrid.json: fuzzers -.INTERMEDIATE: fuzzers -fuzzers: SHELL:=/bin/bash -fuzzers: settings.sh - source settings.sh && $(MAKE) -C ../../fuzzers all - -clean: - rm -f *.db tileconn.json tilegrid.json *.yaml - rm -rf html diff --git a/experiments/timfuz/timfuz_checksub.py b/experiments/timfuz/checksub.py similarity index 100% rename from experiments/timfuz/timfuz_checksub.py rename to experiments/timfuz/checksub.py diff --git a/experiments/timfuz/timfuz_corner_csv.py b/experiments/timfuz/corner_csv.py similarity index 100% rename from experiments/timfuz/timfuz_corner_csv.py rename to experiments/timfuz/corner_csv.py diff --git a/experiments/timfuz/timfuz_perf.py b/experiments/timfuz/perf_test.py similarity index 100% rename from experiments/timfuz/timfuz_perf.py rename to experiments/timfuz/perf_test.py diff --git a/experiments/timfuz/solve_leastsq.py b/experiments/timfuz/solve_leastsq.py new file mode 100644 index 00000000..b00c58ad --- /dev/null +++ b/experiments/timfuz/solve_leastsq.py @@ -0,0 +1,272 @@ +#!/usr/bin/env python3 + +# https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html +from scipy.optimize import linprog +from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json, A_ub_np2d, print_eqns, print_eqns_np +from timfuz_massage import massage_equations +import numpy as np +import glob +import json +import math +from collections import OrderedDict +from fractions import Fraction +import sys +import datetime +import os +import time +import timfuz_solve +import numpy +import scipy.optimize as optimize +from scipy.optimize import least_squares + +def run_corner(Anp, b, names, verbose=False, opts={}, meta={}, outfn=None): + # Given timing scores for above delays (-ps) + assert type(Anp[0]) is np.ndarray, type(Anp[0]) + assert type(b) is np.ndarray, type(b) + + #check_feasible(Anp, b) + + ''' + Be mindful of signs + Have something like + timing1/timing 2 are constants + delay1 + delay2 + delay4 >= timing1 + delay2 + delay3 >= timing2 + + But need it in compliant form: + -delay1 + -delay2 + -delay4 <= -timing1 + -delay2 + -delay3 <= -timing2 + ''' + rows = len(Anp) + cols = len(Anp[0]) + + print('Unique delay elements: %d' % len(names)) + print('Input paths') + print(' # timing scores: %d' % len(b)) + print(' Rows: %d' % rows) + + ''' + You must have at least as many things to optimize as variables + That is, the system must be plausibly constrained for it to attempt a solve + If not, you'll get a message like + TypeError: Improper input: N=3 must not exceed M=2 + ''' + if rows < cols: + raise Exception("rows must be >= cols") + + def func(params, xdata, ydata): + return (ydata - np.dot(xdata, params)) + + print('') + # Now find smallest values for delay constants + # Due to input bounds (ex: column limit), some delay elements may get eliminated entirely + print('Running 
leastsq w/ %d r, %d c (%d name)' % (rows, cols, len(names))) + x0 = np.array([0.0 for _x in range(cols)]) + x, cov_x, infodict, mesg, ier = optimize.leastsq(func, x0, args=(Anp, b), full_output=True) + print('x', x) + print('cov_x', cov_x) + print('infodictx', infodict) + print('mesg', mesg) + print('ier', ier) + print(' Solution found: %s' % (ier in (1, 2, 3, 4))) + +def main(): + import argparse + + parser = argparse.ArgumentParser( + description= + 'Solve timing solution' + ) + + parser.add_argument('--verbose', action='store_true', help='') + parser.add_argument('--massage', action='store_true', help='') + parser.add_argument('--sub-json', help='Group substitutions to make fully ranked') + parser.add_argument('--corner', default="slow_max", help='') + parser.add_argument('--out', default=None, help='output timing delay .json') + parser.add_argument( + 'fns_in', + nargs='*', + help='timing3.csv input files') + args = parser.parse_args() + # Store options in dict to ease passing through functions + bench = Benchmark() + + fns_in = args.fns_in + if not fns_in: + fns_in = glob.glob('specimen_*/timing3.csv') + + sub_json = None + if args.sub_json: + sub_json = load_sub(args.sub_json) + + try: + timfuz_solve.run(run_corner=run_corner, sub_json=sub_json, + fns_in=fns_in, corner=args.corner, massage=args.massage, outfn=args.out, verbose=args.verbose) + finally: + print('Exiting after %s' % bench) + +# optimize.curve_fit wrapper +def test1(): + # Generate artificial data = straight line with a=0 and b=1 + # plus some noise. + xdata = np.array([0.0,1.0,2.0,3.0,4.0,5.0]) + ydata = np.array([0.1,0.9,2.2,2.8,3.9,5.1]) + # Initial guess. + x0 = np.array([0.0, 0.0, 0.0]) + sigma = np.array([1.0,1.0,1.0,1.0,1.0,1.0]) + + def func(x, a, b, c): + return a + b*x + c*x*x + + print(optimize.curve_fit(func, xdata, ydata, x0, sigma)) + +# optimize.leastsq +def test2(): + + # The function whose square is to be minimised. + # params ... list of parameters tuned to minimise function. + # Further arguments: + # xdata ... design matrix for a linear model. + # ydata ... observed data. + def func(params, xdata, ydata): + return (ydata - np.dot(xdata, params)) + + x0 = np.array([0.0, 0.0]) + + ''' + a = 10 + a + b = 100 + ''' + xdata = np.array([[1, 0], + [1, 1]]) + ydata = np.array([10, 100]) + + ''' + x [ 10. 90.] + cov_x [[ 1. -1.] + [-1. 
2.]] + infodictx {'ipvt': array([1, 2], dtype=int32), 'qtf': array([ 1.69649118e-10, 1.38802454e-10]), 'nfev': 7, 'fjac': array([[ 1.41421356, 0.70710678], + [ 0.70710678, 0.70710678]]), 'fvec': array([ 0., 0.])} + mesg The relative error between two consecutive iterates is at most 0.000000 + ier 2 + Solution found: True + ''' + x, cov_x, infodict, mesg, ier = optimize.leastsq(func, x0, args=(xdata, ydata), full_output=True) + print('x', x) + print('cov_x', cov_x) + print('infodictx', infodict) + print('mesg', mesg) + print('ier', ier) + print(' Solution found: %s' % (ier in (1, 2, 3, 4))) + +# non-square +def test3(): + def func(params, xdata, ydata): + return (ydata - np.dot(xdata, params)) + + x0 = np.array([0.0, 0.0, 0.0]) + + ''' + a = 10 + a + b + c = 100 + ''' + xdata = np.array([[1, 0, 0], + [1, 1, 1], + [0, 0, 0]]) + ydata = np.array([10, 100, 0]) + + x, cov_x, infodict, mesg, ier = optimize.leastsq(func, x0, args=(xdata, ydata), full_output=True) + print('x', x) + print('cov_x', cov_x) + print('infodictx', infodict) + print('mesg', mesg) + print('ier', ier) + print(' Solution found: %s' % (ier in (1, 2, 3, 4))) + +def test4(): + def func(params): + print('') + print('iter') + print(params) + print(xdata) + print(ydata) + return (ydata - np.dot(xdata, params)) + + x0 = np.array([0.0, 0.0, 0.0]) + + ''' + You must have at least as many things to optimize as variables + That is, the system must be plausibly constrained for it to attempt a solve + If not, you'll get a message like + TypeError: Improper input: N=3 must not exceed M=2 + ''' + xdata = np.array([[1, 0, 0], + [1, 1, 1], + [1, 0, 1], + [0, 1, 1], + ]) + ydata = np.array([10, 100, 120, 140]) + + x, cov_x, infodict, mesg, ier = optimize.leastsq(func, x0, full_output=True) + print('x', x) + print('cov_x', cov_x) + print('infodictx', infodict) + print('mesg', mesg) + print('ier', ier) + print(' Solution found: %s' % (ier in (1, 2, 3, 4))) + +def test5(): + from scipy.optimize import least_squares + + def fun_rosenbrock(x): + return np.array([10 * (x[1] - x[0]**2), (1 - x[0])]) + x0_rosenbrock = np.array([2, 2]) + res = least_squares(fun_rosenbrock, x0_rosenbrock) + ''' + active_mask: array([ 0., 0.]) + cost: 9.8669242910846867e-30 + fun: array([ 4.44089210e-15, 1.11022302e-16]) + grad: array([ -8.89288649e-14, 4.44089210e-14]) + jac: array([[-20.00000015, 10. ], + [ -1. , 0. ]]) + message: '`gtol` termination condition is satisfied.' 
+ nfev: 3 + njev: 3 + optimality: 8.8928864934219529e-14 + status: 1 + success: True + x: array([ 1., 1.]) + ''' + print(res) + +def test6(): + from scipy.optimize import least_squares + + def func(params): + return (ydata - np.dot(xdata, params)) + + x0 = np.array([0.0, 0.0, 0.0]) + + ''' + a = 10 + a + b + c = 100 + ''' + xdata = np.array([[1, 0, 0], + [1, 1, 1], + [0, 0, 0]]) + ydata = np.array([10, 100, 0]) + + res = least_squares(func, x0) + ''' + ''' + print(res) + +if __name__ == '__main__': + #main() + #test1() + #test2() + #test3() + #test4() + #test5() + test6() + diff --git a/experiments/timfuz/solve_linprog.py b/experiments/timfuz/solve_linprog.py new file mode 100644 index 00000000..2eef5e75 --- /dev/null +++ b/experiments/timfuz/solve_linprog.py @@ -0,0 +1,150 @@ +#!/usr/bin/env python3 + +# https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html +from scipy.optimize import linprog +from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json, A_ub_np2d, print_eqns, print_eqns_np +from timfuz_massage import massage_equations +import numpy as np +import glob +import json +import math +from collections import OrderedDict +from fractions import Fraction +import sys +import datetime +import os +import time +import timfuz_solve + +def run_corner(Anp, b, names, verbose=False, opts={}, meta={}, outfn=None): + # Given timing scores for above delays (-ps) + assert type(Anp[0]) is np.ndarray, type(Anp[0]) + assert type(b) is np.ndarray, type(b) + + #check_feasible(Anp, b) + + ''' + Be mindful of signs + Have something like + timing1/timing 2 are constants + delay1 + delay2 + delay4 >= timing1 + delay2 + delay3 >= timing2 + + But need it in compliant form: + -delay1 + -delay2 + -delay4 <= -timing1 + -delay2 + -delay3 <= -timing2 + ''' + rows = len(Anp) + cols = len(Anp[0]) + print('Scaling to solution form...') + b_ub = -1.0 * b + #A_ub = -1.0 * Anp + A_ub = [-1.0 * x for x in Anp] + + if verbose: + print('') + print('A_ub b_ub') + print_eqns_np(A_ub, b_ub, verbose=verbose) + print('') + + print('Creating misc constants...') + # Minimization function scalars + # Treat all logic elements as equally important + c = [1 for _i in range(len(names))] + # Delays cannot be negative + # (this is also the default constraint) + #bounds = [(0, None) for _i in range(len(names))] + # Also you can provide one to apply to all + bounds = (0, None) + + # Seems to take about rows + 3 iterations + # Give some margin + #maxiter = int(1.1 * rows + 100) + #maxiter = max(1000, int(1000 * rows + 1000)) + # Most of the time I want it to just keep going unless I ^C it + maxiter = 1000000 + + if verbose >= 2: + print('b_ub', b) + print('Unique delay elements: %d' % len(names)) + print(' # delay minimization weights: %d' % len(c)) + print(' # delay constraints: %d' % len(bounds)) + print('Input paths') + print(' # timing scores: %d' % len(b)) + print(' Rows: %d' % rows) + + tlast = [time.time()] + iters = [0] + printn = [0] + def callback(xk, **kwargs): + iters[0] = kwargs['nit'] + if time.time() - tlast[0] > 1.0: + sys.stdout.write('I:%d ' % kwargs['nit']) + tlast[0] = time.time() + printn[0] += 1 + if printn[0] % 10 == 0: + sys.stdout.write('\n') + sys.stdout.flush() + + print('') + # Now find smallest values for delay constants + # Due to input bounds (ex: column limit), some delay elements may get eliminated entirely + print('Running linprog w/ %d r, %d c (%d name)' % (rows, cols, len(names))) + res = 
linprog(c, A_ub=A_ub, b_ub=b_ub, bounds=bounds, callback=callback, + options={"disp": True, 'maxiter': maxiter, 'bland': True, 'tol': 1e-6,}) + nonzeros = 0 + print('Ran %d iters' % iters[0]) + if res.success: + print('Result sample (%d elements)' % (len(res.x))) + plim = 3 + for xi, (name, x) in enumerate(zip(names, res.x)): + nonzero = x >= 0.001 + if nonzero: + nonzeros += 1 + #if nonzero and (verbose >= 1 or xi > 30): + if nonzero and (verbose or ((nonzeros < 100 or nonzeros % 20 == 0) and nonzeros <= plim)): + print(' % 4u % -80s % 10.1f' % (xi, name, x)) + print('Delay on %d / %d' % (nonzeros, len(res.x))) + if not os.path.exists('res'): + os.mkdir('res') + fn_out = 'res/%s' % datetime.datetime.utcnow().isoformat().split('.')[0] + print('Writing %s' % fn_out) + np.save(fn_out, (3, c, A_ub, b_ub, bounds, names, res, meta)) + +def main(): + import argparse + + parser = argparse.ArgumentParser( + description= + 'Solve timing solution' + ) + + parser.add_argument('--verbose', action='store_true', help='') + parser.add_argument('--massage', action='store_true', help='') + parser.add_argument('--sub-json', help='Group substitutions to make fully ranked') + parser.add_argument('--corner', default="slow_max", help='') + parser.add_argument('--out', default=None, help='output timing delay .json') + parser.add_argument( + 'fns_in', + nargs='*', + help='timing3.csv input files') + args = parser.parse_args() + # Store options in dict to ease passing through functions + bench = Benchmark() + + fns_in = args.fns_in + if not fns_in: + fns_in = glob.glob('specimen_*/timing3.csv') + + sub_json = None + if args.sub_json: + sub_json = load_sub(args.sub_json) + + try: + timfuz_solve.run(run_corner=run_corner, sub_json=sub_json, + fns_in=fns_in, corner=args.corner, massage=args.massage, outfn=args.out, verbose=args.verbose) + finally: + print('Exiting after %s' % bench) + +if __name__ == '__main__': + main() diff --git a/experiments/timfuz/timfuz_sub2csv.py b/experiments/timfuz/sub2csv.py similarity index 100% rename from experiments/timfuz/timfuz_sub2csv.py rename to experiments/timfuz/sub2csv.py diff --git a/experiments/timfuz/timfuz.py b/experiments/timfuz/timfuz.py index 01727a4b..d2bcd300 100644 --- a/experiments/timfuz/timfuz.py +++ b/experiments/timfuz/timfuz.py @@ -718,6 +718,9 @@ def load_sub(fn): return j def row_sub_syms(row, sub_json, verbose=False): + zero = Fraction(0) + zero = 0 + if 0 and verbose: print("") print(row.items()) @@ -751,8 +754,9 @@ def row_sub_syms(row, sub_json, verbose=False): if verbose: print('pivot %i %s' % (n, pivot)) for subk, subv in sorted(sub_json['subs'][group].items()): - oldn = row.get(subk, Fraction(0)) - rown = oldn - n * subv + oldn = row.get(subk, zero) + rown = -n * subv + rown += type(rown)(oldn) if verbose: print(" %s: %d => %d" % (subk, oldn, rown)) if rown == 0: @@ -768,8 +772,9 @@ def row_sub_syms(row, sub_json, verbose=False): # after all constants are applied, the row should end up positive? 
# numeric precision issues previously limited this
+    # Ex: AssertionError: ('PIP_BSW_2ELSING0', -2.220446049250313e-16)
-    for k, v in sorted(row.items()):
-        assert v > 0, (k, v)
+    if 0:
+        for k, v in sorted(row.items()):
+            assert v > 0, (k, v)
 
 def run_sub_json(Ads, sub_json, verbose=False):
     nrows = 0
@@ -805,7 +810,7 @@ def run_sub_json(Ads, sub_json, verbose=False):
     print('')
     print("Sub: %u / %u rows changed" % (nsubs, nrows))
-    print("Sub: %u => %u cols" % (ncols_old, ncols_new))
+    print("Sub: %u => %u non-zero row cols" % (ncols_old, ncols_new))
 
 def print_eqns(Ads, b, verbose=0, lim=3, label=''):
     rows = len(b)

diff --git a/experiments/timfuz/timfuz_massage.py b/experiments/timfuz/timfuz_massage.py
index 3c7b78b8..046886ce 100644
--- a/experiments/timfuz/timfuz_massage.py
+++ b/experiments/timfuz/timfuz_massage.py
@@ -322,6 +322,7 @@ def derive_eq_by_col(Ads, b_ub, verbose=0):
     print('Derive col: %d => %d rows' % (len(b_ub), len(b_ret)))
     return Ads_ret, b_ret
 
+# keep deriving until solution is (probably) stable
 def massage_equations_old(Ads, b, verbose=False, derive_lim=3):
     '''
     Equation pipeline
@@ -392,7 +393,8 @@ def massage_equations_old(Ads, b, verbose=False, derive_lim=3):
     debug("final (sorted)")
     return Ads, b
 
-def massage_equations_old2(Ads, b, verbose=False):
+# iteratively increasing column limit until all columns are added
+def massage_equations_inc_col_lim(Ads, b, verbose=False):
     '''
     Equation pipeline
     Some operations may generate new equations
@@ -463,7 +465,9 @@ def massage_equations_old2(Ads, b, verbose=False):
     print('Massage final: %d => %d rows' % (dstart, dend))
     return Ads, b
 
-def massage_equations(Ads, b, verbose=False):
+# only derive based on nearby equations
+# theory is they will be the best to diff
+def massage_equations_near(Ads, b, verbose=False):
     '''
     Equation pipeline
     Some operations may generate new equations
@@ -525,3 +529,5 @@ def massage_equations(Ads, b, verbose=False):
     print('')
     print('Massage final: %d => %d rows' % (dstart, dend))
     return Ads, b
+
+massage_equations = massage_equations_inc_col_lim

diff --git a/experiments/timfuz/timfuz_solve.py b/experiments/timfuz/timfuz_solve.py
index 356476e5..a2e6526a 100644
--- a/experiments/timfuz/timfuz_solve.py
+++ b/experiments/timfuz/timfuz_solve.py
@@ -32,9 +32,12 @@ def check_feasible(A_ub, b_ub):
 
     progress = max(1, rows / 100)
 
-    # Chose a high arbitrary value for x
-    # Delays should be in order of ns, so a 10 ns delay should be way above what anything should be
-    xs = [10e3 for _i in range(cols)]
+    '''
+    Delays should be in order of ns, so a 10 ns delay should be way above what anything should be
+    Series can have several hundred delay elements
+    Max delay in ballpark
+    '''
+    xs = [1e9 for _i in range(cols)]
 
     # FIXME: use the correct np function to do this for me
     # Verify bounds
@@ -65,102 +68,14 @@ def check_feasible(A_ub, b_ub):
         raise Exception("Bad ")
     print(' done')
 
-def run_corner(Anp, b, names, verbose=False, opts={}, meta={}):
-    # Given timing scores for above delays (-ps)
-    assert type(Anp[0]) is np.ndarray, type(Anp[0])
-    assert type(b) is np.ndarray, type(b)
-
-    #check_feasible(Anp, b)
-
-    '''
-    Be mindful of signs
-    Have something like
-    timing1/timing 2 are constants
-    delay1 + delay2 + delay4 >= timing1
-    delay2 + delay3 >= timing2
-
-    But need it in compliant form:
-    -delay1 + -delay2 + -delay4 <= -timing1
-    -delay2 + -delay3 <= -timing2
-    '''
-    rows = len(Anp)
-    cols = len(Anp[0])
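For intuition on the massage_equations variants above: all of them ultimately subtract overlapping constraints so that shared delay terms cancel, which is what keeps the solver from dumping the whole path delay into one shared variable. In the exact equality case the core move looks like this (standalone sketch; derive_sub and the toy rows are made up, and the real derive_eq_by_* passes additionally handle the min/max corner inequalities and coefficient scaling):

    def derive_sub(big, b_big, small, b_small):
        # subtract equation small from big when small's terms are contained in big
        if any(big.get(k, 0) < v for k, v in small.items()):
            return None
        diff = {k: v - small.get(k, 0) for k, v in big.items() if v != small.get(k, 0)}
        return diff, b_big - b_small

    # t0 + t1 = 10 combined with t0 = 5 derives t1 = 5
    print(derive_sub({'t0': 1, 't1': 1}, 10, {'t0': 1}, 5))  # ({'t1': 1}, 5)

-    print('Scaling to solution 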
form...') - b_ub = -1.0 * b - #A_ub = -1.0 * Anp - A_ub = [-1.0 * x for x in Anp] - - if verbose: - print('') - print('A_ub b_ub') - print_eqns_np(A_ub, b_ub, verbose=verbose) - print('') - - print('Creating misc constants...') - # Minimization function scalars - # Treat all logic elements as equally important - c = [1 for _i in range(len(names))] - # Delays cannot be negative - # (this is also the default constraint) - #bounds = [(0, None) for _i in range(len(names))] - # Also you can provide one to apply to all - bounds = (0, None) - - # Seems to take about rows + 3 iterations - # Give some margin - #maxiter = int(1.1 * rows + 100) - #maxiter = max(1000, int(1000 * rows + 1000)) - # Most of the time I want it to just keep going unless I ^C it - maxiter = 1000000 - - if verbose >= 2: - print('b_ub', b) - print('Unique delay elements: %d' % len(names)) - print(' # delay minimization weights: %d' % len(c)) - print(' # delay constraints: %d' % len(bounds)) - print('Input paths') - print(' # timing scores: %d' % len(b)) - print(' Rows: %d' % rows) - - tlast = [time.time()] - iters = [0] - printn = [0] - def callback(xk, **kwargs): - iters[0] = kwargs['nit'] - if time.time() - tlast[0] > 1.0: - sys.stdout.write('I:%d ' % kwargs['nit']) - tlast[0] = time.time() - printn[0] += 1 - if printn[0] % 10 == 0: - sys.stdout.write('\n') - sys.stdout.flush() - - print('') - # Now find smallest values for delay constants - # Due to input bounds (ex: column limit), some delay elements may get eliminated entirely - print('Running linprog w/ %d r, %d c (%d name)' % (rows, cols, len(names))) - res = linprog(c, A_ub=A_ub, b_ub=b_ub, bounds=bounds, callback=callback, - options={"disp": True, 'maxiter': maxiter, 'bland': True, 'tol': 1e-6,}) - nonzeros = 0 - print('Ran %d iters' % iters[0]) - if res.success: - print('Result sample (%d elements)' % (len(res.x))) - plim = 3 - for xi, (name, x) in enumerate(zip(names, res.x)): - nonzero = x >= 0.001 - if nonzero: - nonzeros += 1 - #if nonzero and (verbose >= 1 or xi > 30): - if nonzero and (verbose or ((nonzeros < 100 or nonzeros % 20 == 0) and nonzeros <= plim)): - print(' % 4u % -80s % 10.1f' % (xi, name, x)) - print('Delay on %d / %d' % (nonzeros, len(res.x))) - if not os.path.exists('res'): - os.mkdir('res') - fn_out = 'res/%s' % datetime.datetime.utcnow().isoformat().split('.')[0] - print('Writing %s' % fn_out) - np.save(fn_out, (3, c, A_ub, b_ub, bounds, names, res, meta)) - -def run(fns_in, corner, sub_json=None, dedup=True, massage=False, verbose=False): +def run(fns_in, corner, run_corner, sub_json=None, dedup=True, massage=False, outfn=None, verbose=False, **kwargs): + print('Loading data') Ads, b = loadc_Ads_b(fns_in, corner, ico=True) # Remove duplicate rows @@ -168,15 +83,19 @@ def run(fns_in, corner, sub_json=None, dedup=True, massage=False, verbose=False) # maybe better to just add them into the matrix directly if dedup: oldn = len(Ads) + iold = instances(Ads) Ads, b = simplify_rows(Ads, b) print('Simplify %u => %u rows' % (oldn, len(Ads))) - + print('Simplify %u => %u instances' % (iold, instances(Ads))) + if sub_json: print('Sub: %u rows' % len(Ads)) + iold = instances(Ads) names_old = index_names(Ads) run_sub_json(Ads, sub_json, verbose=verbose) names = index_names(Ads) print("Sub: %u => %u names" % (len(names_old), len(names))) + print('Sub: %u => %u instances' % (iold, instances(Ads))) else: names = index_names(Ads) @@ -187,46 +106,20 @@ def run(fns_in, corner, sub_json=None, dedup=True, massage=False, verbose=False) #print #col_dist(A_ubd, 
'final', names)
 
+    '''
+    Given:
+    a >= 10
+    a + b >= 100
+    A valid solution is:
+    a = 100
+    However, a better solution is something like
+    a = 10
+    b = 90
+    This creates derived constraints to provide more realistic results
+    '''
     if massage:
         Ads, b = massage_equations(Ads, b)
 
     print('Converting to numpy...')
     names, Anp = A_ds2np(Ads)
-    run_corner(Anp, np.asarray(b), names, verbose=verbose)
-
-def main():
-    import argparse
-
-    parser = argparse.ArgumentParser(
-        description=
-        'Solve timing solution'
-    )
-
-    parser.add_argument('--verbose', action='store_true', help='')
-    parser.add_argument('--massage', action='store_true', help='')
-    parser.add_argument('--sub-json', help='Group substitutions to make fully ranked')
-    parser.add_argument('--corner', default="slow_max", help='')
-    parser.add_argument(
-        'fns_in',
-        nargs='*',
-        help='timing3.csv input files')
-    args = parser.parse_args()
-    # Store options in dict to ease passing through functions
-    bench = Benchmark()
-
-    fns_in = args.fns_in
-    if not fns_in:
-        fns_in = glob.glob('specimen_*/timing3.csv')
-
-    sub_json = None
-    if args.sub_json:
-        sub_json = load_sub(args.sub_json)
-
-    try:
-        run(sub_json=sub_json,
-            fns_in=fns_in, verbose=args.verbose, corner=args.corner, massage=args.massage)
-    finally:
-        print('Exiting after %s' % bench)
-
-if __name__ == '__main__':
-    main()
+    run_corner(Anp, np.asarray(b), names, outfn=outfn, verbose=verbose, **kwargs)

From 9e63d9ee55ba5c26664f41f2fbfb419c5bd78fb3 Mon Sep 17 00:00:00 2001
From: John McMaster
Date: Wed, 29 Aug 2018 13:31:53 -0700
Subject: [PATCH 15/55] timfuz: leastsq reasonable delays

Signed-off-by: John McMaster
---
 experiments/timfuz/solve_leastsq.py | 47 ++++++++++++++++++++---------
 1 file changed, 33 insertions(+), 14 deletions(-)

diff --git a/experiments/timfuz/solve_leastsq.py b/experiments/timfuz/solve_leastsq.py
index b00c58ad..1fc2f8f9 100644
--- a/experiments/timfuz/solve_leastsq.py
+++ b/experiments/timfuz/solve_leastsq.py
@@ -19,6 +19,17 @@ import numpy
 import scipy.optimize as optimize
 from scipy.optimize import least_squares
 
+def mkestimate(Anp, b):
+    cols = len(Anp[0])
+    x0 = np.array([1e3 for _x in range(cols)])
+    for row_np, row_b in zip(Anp, b):
+        for coli, val in enumerate(row_np):
+            if val:
+                ub = row_b / val
+                if ub >= 0:
+                    x0[coli] = min(x0[coli], ub)
+    return x0
+
 def run_corner(Anp, b, names, verbose=False, opts={}, meta={}, outfn=None):
     # Given timing scores for above delays (-ps)
     assert type(Anp[0]) is np.ndarray, type(Anp[0])
@@ -54,21 +65,31 @@ def run_corner(Anp, b, names, verbose=False, opts={}, meta={}, outfn=None):
     if rows < cols:
         raise Exception("rows must be >= cols")
 
-    def func(params, xdata, ydata):
-        return (ydata - np.dot(xdata, params))
+    def func(params):
+        return (b - np.dot(Anp, params))
 
     print('')
     # Now find smallest values for delay constants
     # Due to input bounds (ex: column limit), some delay elements may get eliminated entirely
     print('Running leastsq w/ %d r, %d c (%d name)' % (rows, cols, len(names)))
-    x0 = np.array([0.0 for _x in range(cols)])
-    x, cov_x, infodict, mesg, ier = optimize.leastsq(func, x0, args=(Anp, b), full_output=True)
-    print('x', x)
-    print('cov_x', cov_x)
-    print('infodictx', infodict)
-    print('mesg', mesg)
-    print('ier', ier)
-    print('  Solution found: %s' % (ier in (1, 2, 3, 4)))
+    # starting at 0 completes quickly, but gives a solution near 0 with terrible results
+    # maybe give a starting estimate to the smallest net delay with the indicated variable
+    #x0 = np.array([1000.0 for _x in range(cols)])
+    x0 = mkestimate(Anp, b)
+    #print('x0', x0)
+    if 0:
+        x, cov_x, infodict, mesg, ier = optimize.leastsq(func, x0, args=(), full_output=True)
+        print('x', x)
+        print('cov_x', cov_x)
+        print('infodictx', infodict)
+        print('mesg', mesg)
+        print('ier', ier)
+        print('  Solution found: %s' % (ier in (1, 2, 3, 4)))
+    else:
+        res = least_squares(func, x0, bounds=(0, float('inf')))
+        print(res)
+        print('')
+        print(res.x)
 
 def main():
     import argparse
@@ -240,8 +261,6 @@ def test5():
     print(res)
 
 def test6():
-    from scipy.optimize import least_squares
-
     def func(params):
         return (ydata - np.dot(xdata, params))
 
@@ -262,11 +281,11 @@ def test6():
     print(res)
 
 if __name__ == '__main__':
-    #main()
+    main()
     #test1()
     #test2()
     #test3()
     #test4()
     #test5()
-    test6()
+    #test6()

From 4fee67322f623fad671bc0289e3eb20135ce1e5f Mon Sep 17 00:00:00 2001
From: John McMaster
Date: Wed, 29 Aug 2018 13:37:20 -0700
Subject: [PATCH 16/55] timfuz leastsq: iteration print

Signed-off-by: John McMaster
---
 experiments/timfuz/solve_leastsq.py | 27 ++++++++++++++++++++++---
 1 file changed, 24 insertions(+), 3 deletions(-)

diff --git a/experiments/timfuz/solve_leastsq.py b/experiments/timfuz/solve_leastsq.py
index 1fc2f8f9..0fc362c8 100644
--- a/experiments/timfuz/solve_leastsq.py
+++ b/experiments/timfuz/solve_leastsq.py
@@ -65,7 +65,23 @@ def run_corner(Anp, b, names, verbose=False, opts={}, meta={}, outfn=None):
     if rows < cols:
         raise Exception("rows must be >= cols")
 
+    tlast = [None]
+    iters = [0]
+    printn = [0]
+    def progress_print():
+        iters[0] += 1
+        if tlast[0] is None:
+            tlast[0] = time.time()
+        if time.time() - tlast[0] > 1.0:
+            sys.stdout.write('I:%d ' % iters[0])
+            tlast[0] = time.time()
+            printn[0] += 1
+            if printn[0] % 10 == 0:
+                sys.stdout.write('\n')
+            sys.stdout.flush()
+
     def func(params):
+        progress_print()
         return (b - np.dot(Anp, params))
 
     print('')
@@ -75,8 +91,10 @@ def run_corner(Anp, b, names, verbose=False, opts={}, meta={}, outfn=None):
     # starting at 0 completes quickly, but gives a solution near 0 with terrible results
     # maybe give a starting estimate to the smallest net delay with the indicated variable
     #x0 = np.array([1000.0 for _x in range(cols)])
+    print('Creating x0 estimate')
     x0 = mkestimate(Anp, b)
     #print('x0', x0)
+
     if 0:
         x, cov_x, infodict, mesg, ier = optimize.leastsq(func, x0, args=(), full_output=True)
         print('x', x)
@@ -86,10 +104,13 @@ def run_corner(Anp, b, names, verbose=False, opts={}, meta={}, outfn=None):
         print('ier', ier)
         print('  Solution found: %s' % (ier in (1, 2, 3, 4)))
     else:
+        print('Solving')
         res = least_squares(func, x0, bounds=(0, float('inf')))
-        print(res)
-        print('')
-        print(res.x)
+        if 0:
+            print(res)
+            print('')
+            print(res.x)
+        print('Done')
 
 def main():
     import argparse

From 7021c638c279257a1520c0d33bb551068db3f191 Mon Sep 17 00:00:00 2001
From: John McMaster
Date: Wed, 29 Aug 2018 13:41:14 -0700
Subject: [PATCH 17/55] timfuz: timfuz_rref => rref

Signed-off-by: John McMaster
---
 experiments/timfuz/{timfuz_rref.py => rref.py} | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 rename experiments/timfuz/{timfuz_rref.py => rref.py} (100%)

diff --git a/experiments/timfuz/timfuz_rref.py b/experiments/timfuz/rref.py
similarity index 100%
rename from experiments/timfuz/timfuz_rref.py
rename to experiments/timfuz/rref.py

From 250e48c7a8934dc6ce9e3e9ef568591dc11f58a7 Mon Sep 17 00:00:00 2001
From: John McMaster
Date: Wed, 29 Aug 2018 13:41:56 -0700
Subject: [PATCH 18/55] timfuz: move to top level

Signed-off-by: John McMaster
---
 {experiments/timfuz => timfuz}/.gitignore | 0
 {experiments/timfuz => 
timfuz}/Makefile | 0 {experiments/timfuz => timfuz}/README.txt | 0 {experiments/timfuz => timfuz}/benchmark.py | 0 {experiments/timfuz => timfuz}/checksub.py | 0 {experiments/timfuz => timfuz}/corner_csv.py | 0 {experiments/timfuz => timfuz}/generate.sh | 0 {experiments/timfuz => timfuz}/generate.tcl | 0 {experiments/timfuz => timfuz}/node_unique.py | 0 {experiments/timfuz => timfuz}/oneblinkw.v | 0 {experiments/timfuz => timfuz}/perf_test.py | 0 {experiments/timfuz => timfuz}/picorv32.v | 0 {experiments/timfuz => timfuz}/pip_unique.py | 0 {experiments/timfuz => timfuz}/placelut.py | 0 {experiments/timfuz => timfuz}/placelut_fb.py | 0 {experiments/timfuz => timfuz}/placelut_ff_fb.py | 0 {experiments/timfuz => timfuz}/rref.py | 0 {experiments/timfuz => timfuz}/solve_leastsq.py | 0 {experiments/timfuz => timfuz}/solve_linprog.py | 0 {experiments/timfuz => timfuz}/speed.sh | 0 {experiments/timfuz => timfuz}/speed.tcl | 0 {experiments/timfuz => timfuz}/speed_json.py | 0 {experiments/timfuz => timfuz}/sub2csv.py | 0 {experiments/timfuz => timfuz}/timfuz.py | 0 {experiments/timfuz => timfuz}/timfuz_csv.py | 0 {experiments/timfuz => timfuz}/timfuz_massage.py | 0 {experiments/timfuz => timfuz}/timfuz_solve.py | 0 {experiments/timfuz => timfuz}/top.v | 0 {experiments/timfuz => timfuz}/wire_unique.py | 0 29 files changed, 0 insertions(+), 0 deletions(-) rename {experiments/timfuz => timfuz}/.gitignore (100%) rename {experiments/timfuz => timfuz}/Makefile (100%) rename {experiments/timfuz => timfuz}/README.txt (100%) rename {experiments/timfuz => timfuz}/benchmark.py (100%) rename {experiments/timfuz => timfuz}/checksub.py (100%) rename {experiments/timfuz => timfuz}/corner_csv.py (100%) rename {experiments/timfuz => timfuz}/generate.sh (100%) rename {experiments/timfuz => timfuz}/generate.tcl (100%) rename {experiments/timfuz => timfuz}/node_unique.py (100%) rename {experiments/timfuz => timfuz}/oneblinkw.v (100%) rename {experiments/timfuz => timfuz}/perf_test.py (100%) rename {experiments/timfuz => timfuz}/picorv32.v (100%) rename {experiments/timfuz => timfuz}/pip_unique.py (100%) rename {experiments/timfuz => timfuz}/placelut.py (100%) rename {experiments/timfuz => timfuz}/placelut_fb.py (100%) rename {experiments/timfuz => timfuz}/placelut_ff_fb.py (100%) rename {experiments/timfuz => timfuz}/rref.py (100%) rename {experiments/timfuz => timfuz}/solve_leastsq.py (100%) rename {experiments/timfuz => timfuz}/solve_linprog.py (100%) rename {experiments/timfuz => timfuz}/speed.sh (100%) rename {experiments/timfuz => timfuz}/speed.tcl (100%) rename {experiments/timfuz => timfuz}/speed_json.py (100%) rename {experiments/timfuz => timfuz}/sub2csv.py (100%) rename {experiments/timfuz => timfuz}/timfuz.py (100%) rename {experiments/timfuz => timfuz}/timfuz_csv.py (100%) rename {experiments/timfuz => timfuz}/timfuz_massage.py (100%) rename {experiments/timfuz => timfuz}/timfuz_solve.py (100%) rename {experiments/timfuz => timfuz}/top.v (100%) rename {experiments/timfuz => timfuz}/wire_unique.py (100%) diff --git a/experiments/timfuz/.gitignore b/timfuz/.gitignore similarity index 100% rename from experiments/timfuz/.gitignore rename to timfuz/.gitignore diff --git a/experiments/timfuz/Makefile b/timfuz/Makefile similarity index 100% rename from experiments/timfuz/Makefile rename to timfuz/Makefile diff --git a/experiments/timfuz/README.txt b/timfuz/README.txt similarity index 100% rename from experiments/timfuz/README.txt rename to timfuz/README.txt diff --git a/experiments/timfuz/benchmark.py 
b/timfuz/benchmark.py similarity index 100% rename from experiments/timfuz/benchmark.py rename to timfuz/benchmark.py diff --git a/experiments/timfuz/checksub.py b/timfuz/checksub.py similarity index 100% rename from experiments/timfuz/checksub.py rename to timfuz/checksub.py diff --git a/experiments/timfuz/corner_csv.py b/timfuz/corner_csv.py similarity index 100% rename from experiments/timfuz/corner_csv.py rename to timfuz/corner_csv.py diff --git a/experiments/timfuz/generate.sh b/timfuz/generate.sh similarity index 100% rename from experiments/timfuz/generate.sh rename to timfuz/generate.sh diff --git a/experiments/timfuz/generate.tcl b/timfuz/generate.tcl similarity index 100% rename from experiments/timfuz/generate.tcl rename to timfuz/generate.tcl diff --git a/experiments/timfuz/node_unique.py b/timfuz/node_unique.py similarity index 100% rename from experiments/timfuz/node_unique.py rename to timfuz/node_unique.py diff --git a/experiments/timfuz/oneblinkw.v b/timfuz/oneblinkw.v similarity index 100% rename from experiments/timfuz/oneblinkw.v rename to timfuz/oneblinkw.v diff --git a/experiments/timfuz/perf_test.py b/timfuz/perf_test.py similarity index 100% rename from experiments/timfuz/perf_test.py rename to timfuz/perf_test.py diff --git a/experiments/timfuz/picorv32.v b/timfuz/picorv32.v similarity index 100% rename from experiments/timfuz/picorv32.v rename to timfuz/picorv32.v diff --git a/experiments/timfuz/pip_unique.py b/timfuz/pip_unique.py similarity index 100% rename from experiments/timfuz/pip_unique.py rename to timfuz/pip_unique.py diff --git a/experiments/timfuz/placelut.py b/timfuz/placelut.py similarity index 100% rename from experiments/timfuz/placelut.py rename to timfuz/placelut.py diff --git a/experiments/timfuz/placelut_fb.py b/timfuz/placelut_fb.py similarity index 100% rename from experiments/timfuz/placelut_fb.py rename to timfuz/placelut_fb.py diff --git a/experiments/timfuz/placelut_ff_fb.py b/timfuz/placelut_ff_fb.py similarity index 100% rename from experiments/timfuz/placelut_ff_fb.py rename to timfuz/placelut_ff_fb.py diff --git a/experiments/timfuz/rref.py b/timfuz/rref.py similarity index 100% rename from experiments/timfuz/rref.py rename to timfuz/rref.py diff --git a/experiments/timfuz/solve_leastsq.py b/timfuz/solve_leastsq.py similarity index 100% rename from experiments/timfuz/solve_leastsq.py rename to timfuz/solve_leastsq.py diff --git a/experiments/timfuz/solve_linprog.py b/timfuz/solve_linprog.py similarity index 100% rename from experiments/timfuz/solve_linprog.py rename to timfuz/solve_linprog.py diff --git a/experiments/timfuz/speed.sh b/timfuz/speed.sh similarity index 100% rename from experiments/timfuz/speed.sh rename to timfuz/speed.sh diff --git a/experiments/timfuz/speed.tcl b/timfuz/speed.tcl similarity index 100% rename from experiments/timfuz/speed.tcl rename to timfuz/speed.tcl diff --git a/experiments/timfuz/speed_json.py b/timfuz/speed_json.py similarity index 100% rename from experiments/timfuz/speed_json.py rename to timfuz/speed_json.py diff --git a/experiments/timfuz/sub2csv.py b/timfuz/sub2csv.py similarity index 100% rename from experiments/timfuz/sub2csv.py rename to timfuz/sub2csv.py diff --git a/experiments/timfuz/timfuz.py b/timfuz/timfuz.py similarity index 100% rename from experiments/timfuz/timfuz.py rename to timfuz/timfuz.py diff --git a/experiments/timfuz/timfuz_csv.py b/timfuz/timfuz_csv.py similarity index 100% rename from experiments/timfuz/timfuz_csv.py rename to timfuz/timfuz_csv.py diff --git 
a/experiments/timfuz/timfuz_massage.py b/timfuz/timfuz_massage.py
similarity index 100%
rename from experiments/timfuz/timfuz_massage.py
rename to timfuz/timfuz_massage.py
diff --git a/experiments/timfuz/timfuz_solve.py b/timfuz/timfuz_solve.py
similarity index 100%
rename from experiments/timfuz/timfuz_solve.py
rename to timfuz/timfuz_solve.py
diff --git a/experiments/timfuz/top.v b/timfuz/top.v
similarity index 100%
rename from experiments/timfuz/top.v
rename to timfuz/top.v
diff --git a/experiments/timfuz/wire_unique.py b/timfuz/wire_unique.py
similarity index 100%
rename from experiments/timfuz/wire_unique.py
rename to timfuz/wire_unique.py

From f6fb4cb60c40d9db7e971ad8d39a0f9a08203f18 Mon Sep 17 00:00:00 2001
From: John McMaster
Date: Wed, 29 Aug 2018 14:05:25 -0700
Subject: [PATCH 19/55] timfuz leastsq: write output solution

Signed-off-by: John McMaster
---
 timfuz/solve_leastsq.py | 32 ++++++++++++++++++++++++++++--
 1 file changed, 30 insertions(+), 2 deletions(-)

diff --git a/timfuz/solve_leastsq.py b/timfuz/solve_leastsq.py
index 0fc362c8..6d298969 100644
--- a/timfuz/solve_leastsq.py
+++ b/timfuz/solve_leastsq.py
@@ -111,6 +111,34 @@ def run_corner(Anp, b, names, verbose=False, opts={}, meta={}, outfn=None):
             print('')
             print(res.x)
         print('Done')
+        if outfn:
+            # ballpark minimum actual observed delay is around 7 (carry chain)
+            # anything less than one is probably a solver artifact
+            delta = 0.5
+
+            print('Writing results')
+            skips = 0
+            with open(outfn, 'w') as fout:
+                # write as one variable per line
+                # this natively forms a bound if fed into linprog solver
+                fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n')
+                for xval, name in zip(res.x, names):
+                    row_ico = 1
+
+                    # FIXME: only report for the given corner?
+                    # also review ceil vs floor choice for min vs max
+                    # let's be more conservative for now
+                    if xval < delta:
+                        #print('Skipping %s: %0.6f' % (name, xval))
+                        skips += 1
+                        continue
+                    #xvali = round(xval)
+                    xvali = math.ceil(xval)
+                    corners = [xvali for _ in range(4)]
+                    items = [str(row_ico), ' '.join([str(x) for x in corners])]
+                    items.append('%u %s' % (1, name))
+                    fout.write(','.join(items) + '\n')
+            print('Wrote: skip %u => %u / %u valid delays' % (skips, len(names) - skips, len(names)))
 
 def main():
     import argparse
@@ -142,7 +170,7 @@ def main():
         sub_json = load_sub(args.sub_json)
 
     try:
-        timfuz_solve.run(run_corner=run_corner, sub_json=sub_json,
+        timfuz_solve.run(run_corner=run_corner, sub_json=sub_json,
             fns_in=fns_in, corner=args.corner, massage=args.massage, outfn=args.out, verbose=args.verbose)
     finally:
         print('Exiting after %s' % bench)

From 5ecbd135cef75ae5aa19080e365c7dabde17d9e8 Mon Sep 17 00:00:00 2001
From: John McMaster
Date: Wed, 29 Aug 2018 14:05:48 -0700
Subject: [PATCH 20/55] timfuz leastsq: remove test code

Signed-off-by: John McMaster
---
 timfuz/solve_leastsq.py | 161 ----------------------------------------
 1 file changed, 161 deletions(-)

diff --git a/timfuz/solve_leastsq.py b/timfuz/solve_leastsq.py
index 6d298969..fde102c2 100644
--- a/timfuz/solve_leastsq.py
+++ b/timfuz/solve_leastsq.py
@@ -175,166 +175,5 @@ def main():
     finally:
         print('Exiting after %s' % bench)
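A note on the output rows added above: each solved delay is written as a one-variable constraint in the same CSV grammar the solvers load, so the result doubles as a set of fixed bounds for a later incremental run. For a hypothetical element solved at 123.4, the loop would emit something like (illustrative name and value only):

    ico,fast_max fast_min slow_max slow_min,rows...
    1,124 124 124 124,1 PIP_EXAMPLE

math.ceil rounds up so the recorded bound never understates the fitted delay, and all four corners get the same number until per-corner output is sorted out (the FIXME above).

-# optimize.curve_fit wrapper
-def test1():
-    # Generate artificial data = straight line with a=0 and b=1
-    # plus some noise. 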
- xdata = np.array([0.0,1.0,2.0,3.0,4.0,5.0]) - ydata = np.array([0.1,0.9,2.2,2.8,3.9,5.1]) - # Initial guess. - x0 = np.array([0.0, 0.0, 0.0]) - sigma = np.array([1.0,1.0,1.0,1.0,1.0,1.0]) - - def func(x, a, b, c): - return a + b*x + c*x*x - - print(optimize.curve_fit(func, xdata, ydata, x0, sigma)) - -# optimize.leastsq -def test2(): - - # The function whose square is to be minimised. - # params ... list of parameters tuned to minimise function. - # Further arguments: - # xdata ... design matrix for a linear model. - # ydata ... observed data. - def func(params, xdata, ydata): - return (ydata - np.dot(xdata, params)) - - x0 = np.array([0.0, 0.0]) - - ''' - a = 10 - a + b = 100 - ''' - xdata = np.array([[1, 0], - [1, 1]]) - ydata = np.array([10, 100]) - - ''' - x [ 10. 90.] - cov_x [[ 1. -1.] - [-1. 2.]] - infodictx {'ipvt': array([1, 2], dtype=int32), 'qtf': array([ 1.69649118e-10, 1.38802454e-10]), 'nfev': 7, 'fjac': array([[ 1.41421356, 0.70710678], - [ 0.70710678, 0.70710678]]), 'fvec': array([ 0., 0.])} - mesg The relative error between two consecutive iterates is at most 0.000000 - ier 2 - Solution found: True - ''' - x, cov_x, infodict, mesg, ier = optimize.leastsq(func, x0, args=(xdata, ydata), full_output=True) - print('x', x) - print('cov_x', cov_x) - print('infodictx', infodict) - print('mesg', mesg) - print('ier', ier) - print(' Solution found: %s' % (ier in (1, 2, 3, 4))) - -# non-square -def test3(): - def func(params, xdata, ydata): - return (ydata - np.dot(xdata, params)) - - x0 = np.array([0.0, 0.0, 0.0]) - - ''' - a = 10 - a + b + c = 100 - ''' - xdata = np.array([[1, 0, 0], - [1, 1, 1], - [0, 0, 0]]) - ydata = np.array([10, 100, 0]) - - x, cov_x, infodict, mesg, ier = optimize.leastsq(func, x0, args=(xdata, ydata), full_output=True) - print('x', x) - print('cov_x', cov_x) - print('infodictx', infodict) - print('mesg', mesg) - print('ier', ier) - print(' Solution found: %s' % (ier in (1, 2, 3, 4))) - -def test4(): - def func(params): - print('') - print('iter') - print(params) - print(xdata) - print(ydata) - return (ydata - np.dot(xdata, params)) - - x0 = np.array([0.0, 0.0, 0.0]) - - ''' - You must have at least as many things to optimize as variables - That is, the system must be plausibly constrained for it to attempt a solve - If not, you'll get a message like - TypeError: Improper input: N=3 must not exceed M=2 - ''' - xdata = np.array([[1, 0, 0], - [1, 1, 1], - [1, 0, 1], - [0, 1, 1], - ]) - ydata = np.array([10, 100, 120, 140]) - - x, cov_x, infodict, mesg, ier = optimize.leastsq(func, x0, full_output=True) - print('x', x) - print('cov_x', cov_x) - print('infodictx', infodict) - print('mesg', mesg) - print('ier', ier) - print(' Solution found: %s' % (ier in (1, 2, 3, 4))) - -def test5(): - from scipy.optimize import least_squares - - def fun_rosenbrock(x): - return np.array([10 * (x[1] - x[0]**2), (1 - x[0])]) - x0_rosenbrock = np.array([2, 2]) - res = least_squares(fun_rosenbrock, x0_rosenbrock) - ''' - active_mask: array([ 0., 0.]) - cost: 9.8669242910846867e-30 - fun: array([ 4.44089210e-15, 1.11022302e-16]) - grad: array([ -8.89288649e-14, 4.44089210e-14]) - jac: array([[-20.00000015, 10. ], - [ -1. , 0. ]]) - message: '`gtol` termination condition is satisfied.' 
- nfev: 3 - njev: 3 - optimality: 8.8928864934219529e-14 - status: 1 - success: True - x: array([ 1., 1.]) - ''' - print(res) - -def test6(): - def func(params): - return (ydata - np.dot(xdata, params)) - - x0 = np.array([0.0, 0.0, 0.0]) - - ''' - a = 10 - a + b + c = 100 - ''' - xdata = np.array([[1, 0, 0], - [1, 1, 1], - [0, 0, 0]]) - ydata = np.array([10, 100, 0]) - - res = least_squares(func, x0) - ''' - ''' - print(res) - if __name__ == '__main__': main() - #test1() - #test2() - #test3() - #test4() - #test5() - #test6() - From e83866af720375d2f5ae5aca19b6bb6fe955c575 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Wed, 29 Aug 2018 14:27:57 -0700 Subject: [PATCH 21/55] timfuz: linprog write output csv Signed-off-by: John McMaster --- timfuz/solve_linprog.py | 33 ++++++++++++++++++++++++++++- timfuz/timfuz_solve.py | 47 +++++++++++++++++++++++++++++++++++++---- 2 files changed, 75 insertions(+), 5 deletions(-) diff --git a/timfuz/solve_linprog.py b/timfuz/solve_linprog.py index 2eef5e75..2389de6c 100644 --- a/timfuz/solve_linprog.py +++ b/timfuz/solve_linprog.py @@ -111,6 +111,36 @@ def run_corner(Anp, b, names, verbose=False, opts={}, meta={}, outfn=None): print('Writing %s' % fn_out) np.save(fn_out, (3, c, A_ub, b_ub, bounds, names, res, meta)) + if outfn: + # ballpark minimum actual observed delay is around 7 (carry chain) + # anything less than one is probably a solver artifact + delta = 0.5 + + print('Writing results') + skips = 0 + with open(outfn, 'w') as fout: + # write as one variable per line + # this natively forms a bound if fed into linprog solver + fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') + for xval, name in zip(res.x, names): + row_ico = 1 + + # FIXME: only report for the given corner? + # also review ceil vs floor choice for min vs max + # let's be more conservative for now + if xval < delta: + #print('Skipping %s: %0.6f' % (name, xval)) + skips += 1 + continue + #xvali = round(xval) + xvali = math.ceil(xval) + corners = [xvali for _ in range(4)] + items = [str(row_ico), ' '.join([str(x) for x in corners])] + items.append('%u %s' % (1, name)) + fout.write(','.join(items) + '\n') + print('Wrote: skip %u => %u / %u valid delays' % (skips, len(names) - skips, len(names))) + + def main(): import argparse @@ -121,6 +151,7 @@ def main(): parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--massage', action='store_true', help='') + parser.add_argument('--sub-csv', help='') parser.add_argument('--sub-json', help='Group substitutions to make fully ranked') parser.add_argument('--corner', default="slow_max", help='') parser.add_argument('--out', default=None, help='output timing delay .json') @@ -141,7 +172,7 @@ def main(): sub_json = load_sub(args.sub_json) try: - timfuz_solve.run(run_corner=run_corner, sub_json=sub_json, + timfuz_solve.run(run_corner=run_corner, sub_json=sub_json, sub_csv=args.sub_csv, fns_in=fns_in, corner=args.corner, massage=args.massage, outfn=args.out, verbose=args.verbose) finally: print('Exiting after %s' % bench) diff --git a/timfuz/timfuz_solve.py b/timfuz/timfuz_solve.py index a2e6526a..a7f33e77 100644 --- a/timfuz/timfuz_solve.py +++ b/timfuz/timfuz_solve.py @@ -36,7 +36,7 @@ def check_feasible(A_ub, b_ub): Delays should be in order of ns, so a 10 ns delay should be way above what anything should be Series can have several hundred delay elements Max delay in ballpark - ''' + ''' xs = [1e9 for _i in range(cols)] # FIXME: use the correct np function to do this for me @@ -74,7 +74,29 @@ def
instances(Ads): ret += sum(row_ds.values()) return ret -def run(fns_in, corner, run_corner, sub_json=None, dedup=True, massage=False, outfn=None, verbose=False, **kwargs): +def Ads2bounds(Ads, b): + ret = {} + for row_ds, row_b in zip(Ads, b): + assert len(row_ds) == 1 + k, v = list(row_ds.items())[0] + assert v == 1 + ret[k] = row_b + return ret + +def filter_bounds(Ads, b, bounds): + '''Given min variable delays, remove rows that won't constrain solution''' + ret_Ads = [] + ret_b = [] + for row_ds, row_b in zip(Ads, b): + # some variables get estimated at 0 + est = sum([bounds.get(k, 0) * v for k, v in row_ds.items()]) + # will this row potentially constrain us more? + if row_b > est: + ret_Ads.append(row_ds) + ret_b.append(row_b) + return ret_Ads, ret_b + +def run(fns_in, corner, run_corner, sub_json=None, sub_csv=None, dedup=True, massage=False, outfn=None, verbose=False, **kwargs): print('Loading data') Ads, b = loadc_Ads_b(fns_in, corner, ico=True) @@ -87,7 +109,7 @@ def run(fns_in, corner, run_corner, sub_json=None, dedup=True, massage=False, ou Ads, b = simplify_rows(Ads, b) print('Simplify %u => %u rows' % (oldn, len(Ads))) print('Simplify %u => %u instances' % (iold, instances(Ads))) - + if sub_json: print('Sub: %u rows' % len(Ads)) iold = instances(Ads) @@ -99,6 +121,23 @@ def run(fns_in, corner, run_corner, sub_json=None, dedup=True, massage=False, ou else: names = index_names(Ads) + # post substitution csv + # actually this might not be strictly necessary since subs would just not apply + # however, I wanted to do some filtering based on expected form + if sub_csv: + Ads2, b2 = loadc_Ads_b([sub_csv], corner, ico=True) + if 0: + Ads = Ads + Ads2 + b = b + b2 + else: + bounds = Ads2bounds(Ads2, b2) + rows_old = len(Ads) + Ads, b = filter_bounds(Ads, b, bounds) + print('Filter bounds: %s => %s rows' % (rows_old, len(Ads))) + if 1: + Ads = Ads + Ads2 + b = b + b2 + if verbose: print print_eqns(Ads, b, verbose=verbose) @@ -115,7 +154,7 @@ def run(fns_in, corner, run_corner, sub_json=None, dedup=True, massage=False, ou However, a better solution is something like a = 10 b = 90 - This creates derived constraints to provide more realistic results + This creates derived constraints to provide more realistic results ''' if massage: Ads, b = massage_equations(Ads, b) From 1aa15ae8b612dd228113986cb3f39abd762a688d Mon Sep 17 00:00:00 2001 From: John McMaster Date: Wed, 29 Aug 2018 15:24:41 -0700 Subject: [PATCH 22/55] timfuz: utility to flatten groups out of csv Signed-off-by: John McMaster --- timfuz/csv_group2flat.py | 88 ++++++++++++++++++++++++++++++++++++++++ timfuz/solve_linprog.py | 11 +++-- timfuz/timfuz.py | 16 ++++++++ timfuz/timfuz_solve.py | 11 +---- 4 files changed, 110 insertions(+), 16 deletions(-) create mode 100644 timfuz/csv_group2flat.py diff --git a/timfuz/csv_group2flat.py b/timfuz/csv_group2flat.py new file mode 100644 index 00000000..c88b6992 --- /dev/null +++ b/timfuz/csv_group2flat.py @@ -0,0 +1,88 @@ +#!/usr/bin/env python3 + +# https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html +from scipy.optimize import linprog +from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json, A_ub_np2d, print_eqns, print_eqns_np, Ads2bounds, loadc_Ads_raw +from timfuz_massage import massage_equations +import numpy as np +import glob +import json +import math +from collections import OrderedDict +from fractions import Fraction +import sys +import datetime +import os 
+import time + +def gen_flat(fnin, sub_json): + # FIXME: preserve all bounds + # Ads, bs = loadc_Ads_raw([csv_fn_in]) + Ads, b = loadc_Ads_b([fnin], corner=None, ico=True) + bounds = Ads2bounds(Ads, b) + zeros = set() + nonzeros = set() + + for bound_name, bound_b in bounds.items(): + sub = sub_json['subs'].get(bound_name, None) + if sub: + # put entire delay into pivot + pivot = sub_json['pivots'][bound_name] + assert pivot not in zeros + nonzeros.add(pivot) + non_pivot = set(sub.keys() - set([pivot])) + #for name in non_pivot: + # assert name not in nonzeros, (pivot, name, nonzeros) + zeros.update(non_pivot) + yield pivot, bound_b + else: + nonzeros.add(bound_name) + yield bound_name, bound_b + # non-pivots can appear multiple times, but they should always be zero + # however, due to substitution limitations, just warn + violations = zeros.intersection(nonzeros) + if len(violations): + print('WARNING: %s non-0 non-pivot' % (len(violations))) + + for zero in zeros - violations: + yield zero, 0 + +def run(fnin, fnout, sub_json, corner=None, verbose=False): + with open(fnout, 'w') as fout: + fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') + for name, delay in sorted(gen_flat(fnin, sub_json)): + row_ico = 1 + corners = [delay for _ in range(4)] + items = [str(row_ico), ' '.join([str(x) for x in corners])] + items.append('%u %s' % (1, name)) + fout.write(','.join(items) + '\n') + +def main(): + import argparse + + parser = argparse.ArgumentParser( + description= + 'Flatten timing csv groups back to individual delay elements' + ) + + parser.add_argument('--verbose', action='store_true', help='') + parser.add_argument('--massage', action='store_true', help='') + parser.add_argument('--sub-csv', help='') + parser.add_argument('--sub-json', required=True, help='Group substitutions to make fully ranked') + parser.add_argument('fnin', default=None, help='input timing delay .csv') + parser.add_argument('fnout', default=None, help='output timing delay .csv') + args = parser.parse_args() + # Store options in dict to ease passing through functions + bench = Benchmark() + + sub_json = None + if args.sub_json: + sub_json = load_sub(args.sub_json) + + try: + run(args.fnin, args.fnout, sub_json=sub_json, verbose=args.verbose) + finally: + print('Exiting after %s' % bench) + +if __name__ == '__main__': + main() diff --git a/timfuz/solve_linprog.py b/timfuz/solve_linprog.py index 2389de6c..201ba7ca 100644 --- a/timfuz/solve_linprog.py +++ b/timfuz/solve_linprog.py @@ -117,7 +117,7 @@ def run_corner(Anp, b, names, verbose=False, opts={}, meta={}, outfn=None): delta = 0.5 print('Writing results') - skips = 0 + zeros = 0 with open(outfn, 'w') as fout: # write as one variable per line # this natively forms a bound if fed into linprog solver @@ -129,17 +129,16 @@ def run_corner(Anp, b, names, verbose=False, opts={}, meta={}, outfn=None): # also review ceil vs floor choice for min vs max # let's be more conservative for now if xval < delta: - #print('Skipping %s: %0.6f' % (name, xval)) - skips += 1 - continue + print('WARNING: near 0 delay on %s: %0.6f' % (name, xval)) + zeros += 1 + #continue #xvali = round(xval) xvali = math.ceil(xval) corners = [xvali for _ in range(4)] items = [str(row_ico), ' '.join([str(x) for x in corners])] items.append('%u %s' % (1, name)) fout.write(','.join(items) + '\n') - print('Wrote: skip %u => %u / %u valid delays' % (skips, len(names) - skips, len(names))) + print('Wrote: zeros %u => %u / %u constrained delays' % (zeros, len(names) - zeros, len(names))) def main(): import argparse diff --git
a/timfuz/timfuz.py b/timfuz/timfuz.py index d2bcd300..ec9bfe28 100644 --- a/timfuz/timfuz.py +++ b/timfuz/timfuz.py @@ -701,6 +701,13 @@ def loadc_Ads_b(fns, corner, ico=None): return val[corneri] return loadc_Ads_mkb(fns, mkb, filt) +def loadc_Ads_raw(fns): + filt = lambda ico, corners, vars: True + + def mkb(val): + return val + return loadc_Ads_mkb(fns, mkb, filt) + def index_names(Ads): names = set() for row_ds in Ads: @@ -829,3 +836,12 @@ def print_eqns(Ads, b, verbose=0, lim=3, label=''): def print_eqns_np(A_ub, b_ub, verbose=0): Adi = A_ub_np2d(A_ub) print_eqns(Adi, b_ub, verbose=verbose) + +def Ads2bounds(Ads, b): + ret = {} + for row_ds, row_b in zip(Ads, b): + assert len(row_ds) == 1 + k, v = list(row_ds.items())[0] + assert v == 1 + ret[k] = row_b + return ret diff --git a/timfuz/timfuz_solve.py b/timfuz/timfuz_solve.py index a7f33e77..4fdf5dbf 100644 --- a/timfuz/timfuz_solve.py +++ b/timfuz/timfuz_solve.py @@ -2,7 +2,7 @@ # https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html from scipy.optimize import linprog -from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json, A_ub_np2d, print_eqns, print_eqns_np +from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json, A_ub_np2d, print_eqns, print_eqns_np, Ads2bounds from timfuz_massage import massage_equations import numpy as np import glob @@ -74,15 +74,6 @@ def instances(Ads): ret += sum(row_ds.values()) return ret -def Ads2bounds(Ads, b): - ret = {} - for row_ds, row_b in zip(Ads, b): - assert len(row_ds) == 1 - k, v = list(row_ds.items())[0] - assert v == 1 - ret[k] = row_b - return ret - def filter_bounds(Ads, b, bounds): '''Given min variable delays, remove rows that won't constrain solution''' ret_Ads = [] From e76e84f72c765aaf2e5066b84f92739c4516d317 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Wed, 29 Aug 2018 16:05:10 -0700 Subject: [PATCH 23/55] timfuz: csv_flat2group Signed-off-by: John McMaster --- timfuz/csv_flat2group.py | 71 ++++++++++++++++++++++++++++++++++++++++ timfuz/csv_group2flat.py | 16 +++++---- timfuz/timfuz.py | 26 ++++++++++++--- timfuz/timfuz_solve.py | 8 +---- 4 files changed, 103 insertions(+), 18 deletions(-) create mode 100644 timfuz/csv_flat2group.py diff --git a/timfuz/csv_flat2group.py b/timfuz/csv_flat2group.py new file mode 100644 index 00000000..7a050585 --- /dev/null +++ b/timfuz/csv_flat2group.py @@ -0,0 +1,71 @@ +#!/usr/bin/env python3 + +# https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html +from scipy.optimize import linprog +from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json, A_ub_np2d, print_eqns, print_eqns_np, Ads2bounds, loadc_Ads_raw, instances +from timfuz_massage import massage_equations +import numpy as np +import glob +import json +import math +from collections import OrderedDict +from fractions import Fraction +import sys +import datetime +import os +import time + +def gen_group(fnin, sub_json, strict=False, verbose=False): + print('Loading data') + # FIXME: preserve corners + Ads, b = loadc_Ads_b([fnin], corner=None, ico=True) + + print('Sub: %u rows' % len(Ads)) + iold = instances(Ads) + names_old = index_names(Ads) + run_sub_json(Ads, sub_json, strict=strict, verbose=verbose) + names = index_names(Ads) + print("Sub: %u => %u names" % (len(names_old), 
len(names))) + print('Sub: %u => %u instances' % (iold, instances(Ads))) + + for row_ds, row_b in zip(Ads, b): + yield row_ds, [row_b for _ in range(4)] + +def run(fnin, fnout, sub_json, corner=None, strict=False, verbose=False): + with open(fnout, 'w') as fout: + fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') + for row_ds, row_bs in gen_group(fnin, sub_json, strict=strict): + row_ico = 1 + items = [str(row_ico), ' '.join([str(x) for x in row_bs])] + for k, v in sorted(row_ds.items()): + items.append('%u %s' % (v, k)) + fout.write(','.join(items) + '\n') + +def main(): + import argparse + + parser = argparse.ArgumentParser( + description= + 'Apply substitutions to group timing csv variables' + ) + + parser.add_argument('--verbose', action='store_true', help='') + parser.add_argument('--massage', action='store_true', help='') + parser.add_argument('--strict', action='store_true', help='') + parser.add_argument('--sub-csv', help='') + parser.add_argument('--sub-json', required=True, help='Group substitutions to make fully ranked') + parser.add_argument('fnin', default=None, help='input timing delay .csv') + parser.add_argument('fnout', default=None, help='output timing delay .csv') + args = parser.parse_args() + # Store options in dict to ease passing through functions + bench = Benchmark() + + sub_json = load_sub(args.sub_json) + + try: + run(args.fnin, args.fnout, sub_json=sub_json, strict=args.strict, verbose=args.verbose) + finally: + print('Exiting after %s' % bench) + +if __name__ == '__main__': + main() diff --git a/timfuz/csv_group2flat.py b/timfuz/csv_group2flat.py index c88b6992..14f51b60 100644 --- a/timfuz/csv_group2flat.py +++ b/timfuz/csv_group2flat.py @@ -47,10 +47,15 @@ def gen_flat(fnin, sub_json): for zero in zeros - violations: yield zero, 0 -def run(fnin, fnout, sub_json, corner=None, verbose=False): +def run(fnin, fnout, sub_json, corner=None, sort=False, verbose=False): + if sort: + sortf = sorted + else: + sortf = lambda x: x + with open(fnout, 'w') as fout: fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') - for name, delay in sorted(gen_flat(fnin, sub_json)): + for name, delay in sortf(gen_flat(fnin, sub_json)): row_ico = 1 corners = [delay for _ in range(4)] items = [str(row_ico), ' '.join([str(x) for x in corners])] @@ -67,6 +72,7 @@ def main(): parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--massage', action='store_true', help='') + parser.add_argument('--sort', action='store_true', help='') parser.add_argument('--sub-csv', help='') parser.add_argument('--sub-json', required=True, help='Group substitutions to make fully ranked') parser.add_argument('fnin', default=None, help='input timing delay .csv') @@ -75,12 +81,10 @@ def main(): # Store options in dict to ease passing through functions bench = Benchmark() - sub_json = None - if args.sub_json: - sub_json = load_sub(args.sub_json) + sub_json = load_sub(args.sub_json) try: - run(args.fnin, args.fnout, sub_json=sub_json, verbose=args.verbose) + run(args.fnin, args.fnout, sub_json=sub_json, sort=args.sort, verbose=args.verbose) finally: print('Exiting after %s' % bench) diff --git a/timfuz/timfuz.py b/timfuz/timfuz.py index ec9bfe28..6f2f8918 100644 --- a/timfuz/timfuz.py +++ b/timfuz/timfuz.py @@ -724,7 +724,7 @@ def load_sub(fn): return j -def row_sub_syms(row, sub_json, verbose=False): +def row_sub_syms(row, sub_json, strict=False, verbose=False): zero = Fraction(0) zero = 0 @@ -751,10 +751,10 @@ def row_sub_syms(row, sub_json, verbose=False): n = row[pivot] print(' pivot
%u %s' % (n, pivot)) + #pivots = set(sub_json['pivots'].values()).intersection(row.keys()) for group, pivot in sorted(sub_json['pivots'].items()): if pivot not in row: continue - # take the sub out n times # note constants may be negative n = row[pivot] @@ -779,11 +779,21 @@ def row_sub_syms(row, sub_json, verbose=False): # after all constants are applied, the row should end up positive? # numeric precision issues previously limited this # Ex: AssertionError: ('PIP_BSW_2ELSING0', -2.220446049250313e-16) - if 0: + if strict: + # verify no subs are left + for subs in sub_json['subs'].values(): + for sub in subs: + assert sub not in row, 'Unexpected element %s' % sub + + # Verify all constants are positive for k, v in sorted(row.items()): assert v > 0, (k, v) -def run_sub_json(Ads, sub_json, verbose=False): +def run_sub_json(Ads, sub_json, strict=False, verbose=False): + ''' + strict: complain if a sub doesn't go in evenly + ''' + nrows = 0 nsubs = 0 @@ -801,7 +811,7 @@ def run_sub_json(Ads, sub_json, verbose=False): print('Row %u w/ %u elements' % (rowi, len(row))) row_orig = dict(row) - row_sub_syms(row, sub_json, verbose=verbose) + row_sub_syms(row, sub_json, strict=strict, verbose=verbose) nrows += 1 if row_orig != row: nsubs += 1 @@ -845,3 +855,9 @@ def Ads2bounds(Ads, b): assert v == 1 ret[k] = row_b return ret + +def instances(Ads): + ret = 0 + for row_ds in Ads: + ret += sum(row_ds.values()) + return ret diff --git a/timfuz/timfuz_solve.py b/timfuz/timfuz_solve.py index 4fdf5dbf..c6343e70 100644 --- a/timfuz/timfuz_solve.py +++ b/timfuz/timfuz_solve.py @@ -2,7 +2,7 @@ # https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html from scipy.optimize import linprog -from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json, A_ub_np2d, print_eqns, print_eqns_np, Ads2bounds +from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json, A_ub_np2d, print_eqns, print_eqns_np, Ads2bounds, instances from timfuz_massage import massage_equations import numpy as np import glob @@ -68,12 +68,6 @@ def check_feasible(A_ub, b_ub): raise Exception("Bad ") print(' done') -def instances(Ads): - ret = 0 - for row_ds in Ads: - ret += sum(row_ds.values()) - return ret - def filter_bounds(Ads, b, bounds): '''Given min variable delays, remove rows that won't constrain solution''' ret_Ads = [] From 51763748174140abb16fad6916f9c84a7527e05e Mon Sep 17 00:00:00 2001 From: John McMaster Date: Wed, 29 Aug 2018 16:17:16 -0700 Subject: [PATCH 24/55] timfuz group2flat: remove old option Signed-off-by: John McMaster --- timfuz/csv_group2flat.py | 1 - 1 file changed, 1 deletion(-) diff --git a/timfuz/csv_group2flat.py b/timfuz/csv_group2flat.py index 14f51b60..bf5c2870 100644 --- a/timfuz/csv_group2flat.py +++ b/timfuz/csv_group2flat.py @@ -71,7 +71,6 @@ def main(): ) parser.add_argument('--verbose', action='store_true', help='') - parser.add_argument('--massage', action='store_true', help='') parser.add_argument('--sort', action='store_true', help='') parser.add_argument('--sub-csv', help='') parser.add_argument('--sub-json', required=True, help='Group substitutions to make fully ranked') From fb69b9f0455660495b4a7213bfe02f33054a4d91 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Wed, 29 Aug 2018 17:36:00 -0700 Subject: [PATCH 25/55] timfuz: utility to create tile to speed model database Signed-off-by: John McMaster --- 
timfuz/tile_txt2json.py | 74 ++++++++++++++++ timfuz/timgrid/Makefile | 26 ++++++++ timfuz/timgrid/generate.sh | 16 +++++ timfuz/timgrid/generate.tcl | 119 ++++++++++++++++++++++++++++++++++++ timfuz/timgrid/top.v | 49 +++++++++++++++ timfuz/timgrid/top_bram.v | 62 +++++++++++++++ 6 files changed, 346 insertions(+) create mode 100644 timfuz/tile_txt2json.py create mode 100644 timfuz/timgrid/Makefile create mode 100644 timfuz/timgrid/generate.sh create mode 100644 timfuz/timgrid/generate.tcl create mode 100644 timfuz/timgrid/top.v create mode 100644 timfuz/timgrid/top_bram.v diff --git a/timfuz/tile_txt2json.py b/timfuz/tile_txt2json.py new file mode 100644 index 00000000..06711f87 --- /dev/null +++ b/timfuz/tile_txt2json.py @@ -0,0 +1,74 @@ +#!/usr/bin/env python3 + +import sys +import os +import time +import json + +SI_NONE = 0xFFFF +def load_speed_json(f): + j = json.load(f) + # Index speed indexes to names + speed_i2s = {} + for k, v in j['speed_model'].items(): + i = v['speed_index'] + if i != SI_NONE: + speed_i2s[i] = k + return j, speed_i2s + +def gen_tiles(fnin, speed_i2s): + for l in open(fnin): + # lappend items pip $name $speed_index + # puts $fp "$type $tile $grid_x $grid_y $items" + parts = l.strip().split() + tile_type, tile_name, grid_x, grid_y = parts[0:4] + grid_x, grid_y = int(grid_x), int(grid_y) + tuples = parts[4:] + assert len(tuples) % 3 == 0 + pips = {} + wires = {} + for i in range(0, len(tuples), 3): + ttype, name, speed_index = tuples[i:i+3] + name_local = name.split('/')[1] + { + 'pip': pips, + 'wire': wires, + }[ttype][name_local] = speed_i2s[int(speed_index)] + yield (tile_type, tile_name, grid_x, grid_y, pips, wires) + +def run(fnin, fnout, speed_json_fn, verbose=False): + speedj, speed_i2s = load_speed_json(open(speed_json_fn, 'r')) + + tiles = {} + for tile in gen_tiles(fnin, speed_i2s): + (tile_type, tile_name, grid_x, grid_y, pips, wires) = tile + this_dat = {'pips': pips, 'wires': wires} + if tile_type not in tiles: + tiles[tile_type] = this_dat + else: + if tiles[tile_type] != this_dat: + print(tile_name, tile_type) + print(this_dat) + print(tiles[tile_type]) + assert 0 + + j = {'tiles': tiles} + json.dump(j, open(fnout, 'w'), sort_keys=True, indent=4, separators=(',', ': ')) + +def main(): + import argparse + + parser = argparse.ArgumentParser( + description= + 'Convert tile pip/wire speed index dump to .json' + ) + parser.add_argument('--speed-json', default='build_speed/speed.json', + help='Provides speed index to name translation') + parser.add_argument('fnin', default=None, help='input tcl output .txt') + parser.add_argument('fnout', default=None, help='output .json') + args = parser.parse_args() + + run(args.fnin, args.fnout, speed_json_fn=args.speed_json, verbose=False) + +if __name__ == '__main__': + main() diff --git a/timfuz/timgrid/Makefile b/timfuz/timgrid/Makefile new file mode 100644 index 00000000..c59f83bf --- /dev/null +++ b/timfuz/timgrid/Makefile @@ -0,0 +1,26 @@ + +N := 1 +SPECIMENS := $(addprefix specimen_,$(shell seq -f '%03.0f' $(N))) +SPECIMENS_OK := $(addsuffix /OK,$(SPECIMENS)) + +database: $(SPECIMENS_OK) + cp specimen_001/tilegrid.json tilegrid.json + +pushdb: + cp tilegrid.json ${XRAY_DATABASE_DIR}/$(XRAY_DATABASE)/tilegrid.json + +$(SPECIMENS_OK): + bash generate.sh $(subst /OK,,$@) + touch $@ + +run: + $(MAKE) clean + $(MAKE) database + $(MAKE) pushdb + touch run.ok + +clean: + rm -rf specimen_[0-9][0-9][0-9]/ tilegrid.json run.ok + +.PHONY: database pushdb clean run + diff --git a/timfuz/timgrid/generate.sh b/timfuz/timgrid/generate.sh
new file mode 100644 index 00000000..3efa2478 --- /dev/null +++ b/timfuz/timgrid/generate.sh @@ -0,0 +1,16 @@ +#!/bin/bash -x + +source ${XRAY_GENHEADER} + +vivado -mode batch -source ../generate.tcl + +for x in design*.bit; do + ${XRAY_BITREAD} -F $XRAY_ROI_FRAMES -o ${x}s -z -y $x +done + +for x in design_*.bits; do + diff -u design.bits $x | grep '^[-+]bit' > ${x%.bits}.delta +done + +python3 ../generate.py design_*.delta > tilegrid.json + diff --git a/timfuz/timgrid/generate.tcl b/timfuz/timgrid/generate.tcl new file mode 100644 index 00000000..70a9b030 --- /dev/null +++ b/timfuz/timgrid/generate.tcl @@ -0,0 +1,119 @@ +proc create_project {} { + if 0 { + set grid_min_x -1 + set grid_max_x -1 + set grid_min_y -1 + set grid_max_y -1 + } { + set grid_min_x $::env(XRAY_ROI_GRID_X1) + set grid_max_x $::env(XRAY_ROI_GRID_X2) + set grid_min_y $::env(XRAY_ROI_GRID_Y1) + set grid_max_y $::env(XRAY_ROI_GRID_Y2) + } + + create_project -force -part $::env(XRAY_PART) design design + + read_verilog ../top.v + synth_design -top top + + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_00) IOSTANDARD LVCMOS33" [get_ports clk] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_01) IOSTANDARD LVCMOS33" [get_ports di] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_02) IOSTANDARD LVCMOS33" [get_ports do] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_03) IOSTANDARD LVCMOS33" [get_ports stb] + + create_pblock roi + add_cells_to_pblock [get_pblocks roi] [get_cells roi] + resize_pblock [get_pblocks roi] -add "$::env(XRAY_ROI)" + + set_property CFGBVS VCCO [current_design] + set_property CONFIG_VOLTAGE 3.3 [current_design] + set_property BITSTREAM.GENERAL.PERFRAMECRC YES [current_design] + set_param tcl.collectionResultDisplayLimit 0 + + set_property CLOCK_DEDICATED_ROUTE FALSE [get_nets clk_IBUF] + + set luts [get_bels -of_objects [get_sites -of_objects [get_pblocks roi]] -filter {TYPE =~ LUT*} */A6LUT] + set selected_luts {} + set lut_index 0 + + # LOC one LUT (a "selected_lut") into each CLB segment configuration column (ie 50 per column) + # Also, if GRID_MIN/MAX is not defined, automatically create it based on used CLBs + # See caveat in README on automatic creation + foreach lut $luts { + set tile [get_tile -of_objects $lut] + set grid_x [get_property GRID_POINT_X $tile] + set grid_y [get_property GRID_POINT_Y $tile] + + if [expr $grid_min_x < 0 || $grid_x < $grid_min_x] {set grid_min_x $grid_x} + if [expr $grid_max_x < 0 || $grid_x > $grid_max_x] {set grid_max_x $grid_x} + + if [expr $grid_min_y < 0 || $grid_y < $grid_min_y] {set grid_min_y $grid_y} + if [expr $grid_max_y < 0 || $grid_y > $grid_max_y] {set grid_max_y $grid_y} + + # 50 per column => 50, 100, 150, etc + if [regexp "Y(0|[0-9]*[05]0)/" $lut] { + set cell [get_cells roi/is[$lut_index].lut] + set_property LOC [get_sites -of_objects $lut] $cell + set lut_index [expr $lut_index + 1] + lappend selected_luts $lut + } + } + + place_design + route_design + + write_checkpoint -force design.dcp + write_bitstream -force design.bit +} + +proc write_data {} { + if 0 { + set grid_min_x -1 + set grid_max_x -1 + set grid_min_y -1 + set grid_max_y -1 + } { + set grid_min_x $::env(XRAY_ROI_GRID_X1) + set grid_max_x $::env(XRAY_ROI_GRID_X2) + set grid_min_y $::env(XRAY_ROI_GRID_Y1) + set grid_max_y $::env(XRAY_ROI_GRID_Y2) + } + + # Get all tiles in ROI, ie not just the selected LUTs + set tiles [get_tiles -filter "GRID_POINT_X >= $grid_min_x && GRID_POINT_X <= $grid_max_x && GRID_POINT_Y >= $grid_min_y && GRID_POINT_Y <= $grid_max_y"] + + # Write 
tiles.txt with site metadata + set fp [open "tiles.txt" w] + foreach tile $tiles { + set type [get_property TYPE $tile] + set grid_x [get_property GRID_POINT_X $tile] + set grid_y [get_property GRID_POINT_Y $tile] + + set items {} + + set wires [get_wires -of_objects $tile] + if [llength $wires] { + foreach wire $wires { + set name [get_property NAME $wire] + set speed_index [get_property SPEED_INDEX $wire] + lappend items wire $name $speed_index + } + } + + set pips [get_pips -of_objects $tile] + if [llength $pips] { + foreach pip $pips { + set name [get_property NAME $pip] + set speed_index [get_property SPEED_INDEX $pip] + lappend items pip $name $speed_index + } + } + + puts $fp "$type $tile $grid_x $grid_y $items" + } + close $fp +} + +create_project +write_data + diff --git a/timfuz/timgrid/top.v b/timfuz/timgrid/top.v new file mode 100644 index 00000000..5fd239b5 --- /dev/null +++ b/timfuz/timgrid/top.v @@ -0,0 +1,49 @@ +//Need at least one LUT per frame base address we want +`define N 100 + +module top(input clk, stb, di, output do); + localparam integer DIN_N = 6; + localparam integer DOUT_N = `N; + + reg [DIN_N-1:0] din; + wire [DOUT_N-1:0] dout; + + reg [DIN_N-1:0] din_shr; + reg [DOUT_N-1:0] dout_shr; + + always @(posedge clk) begin + din_shr <= {din_shr, di}; + dout_shr <= {dout_shr, din_shr[DIN_N-1]}; + if (stb) begin + din <= din_shr; + dout_shr <= dout; + end + end + + assign do = dout_shr[DOUT_N-1]; + + roi roi ( + .clk(clk), + .din(din), + .dout(dout) + ); +endmodule + +module roi(input clk, input [5:0] din, output [`N-1:0] dout); + genvar i; + generate + for (i = 0; i < `N; i = i+1) begin:is + LUT6 #( + .INIT(64'h8000_0000_0000_0001 + (i << 16)) + ) lut ( + .I0(din[0]), + .I1(din[1]), + .I2(din[2]), + .I3(din[3]), + .I4(din[4]), + .I5(din[5]), + .O(dout[i]) + ); + end + endgenerate +endmodule diff --git a/timfuz/timgrid/top_bram.v b/timfuz/timgrid/top_bram.v new file mode 100644 index 00000000..880fd375 --- /dev/null +++ b/timfuz/timgrid/top_bram.v @@ -0,0 +1,62 @@ +`define N 100 + +module top(input clk, stb, di, output do); + localparam integer DIN_N = 8; + localparam integer DOUT_N = `N; + + reg [DIN_N-1:0] din; + wire [DOUT_N-1:0] dout; + + reg [DIN_N-1:0] din_shr; + reg [DOUT_N-1:0] dout_shr; + + always @(posedge clk) begin + din_shr <= {din_shr, di}; + dout_shr <= {dout_shr, din_shr[DIN_N-1]}; + if (stb) begin + din <= din_shr; + dout_shr <= dout; + end + end + + assign do = dout_shr[DOUT_N-1]; + + roi roi ( + .clk(clk), + .din(din), + .dout(dout) + ); +endmodule + +module roi(input clk, input [7:0] din, output [`N-1:0] dout); + genvar i; + generate + for (i = 0; i < `N; i = i+1) begin:is + (* KEEP, DONT_TOUCH *) + RAMB36E1 #(.INIT_00(256'h0000000000000000000000000000000000000000000000000000000000000000)) ram ( + .CLKARDCLK(din[0]), + .CLKBWRCLK(din[1]), + .ENARDEN(din[2]), + .ENBWREN(din[3]), + .REGCEAREGCE(din[4]), + .REGCEB(din[5]), + .RSTRAMARSTRAM(din[6]), + .RSTRAMB(din[7]), + .RSTREGARSTREG(din[0]), + .RSTREGB(din[1]), + .ADDRARDADDR(din[2]), + .ADDRBWRADDR(din[3]), + .DIADI(din[4]), + .DIBDI(din[5]), + .DIPADIP(din[6]), + .DIPBDIP(din[7]), + .WEA(din[0]), + .WEBWE(din[1]), + .DOADO(dout[0]), + .DOBDO(), + .DOPADOP(), + .DOPBDOP()); + end + endgenerate +endmodule + From edbd5f4ca92233a789b39cbf85a2b3872d529774 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Wed, 29 Aug 2018 17:58:56 -0700 Subject: [PATCH 26/55] timfuz: tile annotate. Workflow alpha! 
Signed-off-by: John McMaster --- timfuz/tile_annotate.py | 64 +++++++++++++++++++++++++++++++++++++++ 1 file changed, 64 insertions(+) create mode 100644 timfuz/tile_annotate.py diff --git a/timfuz/tile_annotate.py b/timfuz/tile_annotate.py new file mode 100644 index 00000000..e294769b --- /dev/null +++ b/timfuz/tile_annotate.py @@ -0,0 +1,64 @@ +#!/usr/bin/env python3 + +from timfuz import loadc_Ads_b, Ads2bounds + +import sys +import os +import time +import json + +# corner workaround: replicate one value across all four corners +def quad(x): + return [x for _ in range(4)] + +def run(fnin, fnout, tile_json_fn, verbose=False): + # modified in place + tilej = json.load(open(tile_json_fn, 'r')) + + # FIXME: all corners + Ads, b = loadc_Ads_b([fnin], corner=None, ico=True) + bounds = Ads2bounds(Ads, b) + + pipn_net = 0 + pipn_solved = 0 + wiren_net = 0 + wiren_solved = 0 + + for tile in tilej['tiles'].values(): + pips = tile['pips'] + for k, v in pips.items(): + val = bounds.get('PIP_' + v, None) + pips[k] = quad(val) + pipn_net += 1 + if val is not None: + pipn_solved += 1 + + wires = tile['wires'] + for k, v in wires.items(): + val = bounds.get('WIRE_' + v, None) + wires[k] = quad(val) + wiren_net += 1 + if val is not None: + wiren_solved += 1 + + print('Pips: %u / %u solved' % (pipn_solved, pipn_net)) + print('Wires: %u / %u solved' % (wiren_solved, wiren_net)) + + json.dump(tilej, open(fnout, 'w'), sort_keys=True, indent=4, separators=(',', ': ')) + +def main(): + import argparse + + parser = argparse.ArgumentParser( + description= + 'Annotate tile json with solved timing delays' + ) + parser.add_argument('--tile-json', default='tiles.json', help='') + parser.add_argument('fnin', default=None, help='Flattened timing csv') + parser.add_argument('fnout', default=None, help='output tile .json') + args = parser.parse_args() + + run(args.fnin, args.fnout, args.tile_json, verbose=False) + +if __name__ == '__main__': + main() From d96bfd7a8b64d6888d1ff205ba364b6c70e353bd Mon Sep 17 00:00:00 2001 From: John McMaster Date: Mon, 10 Sep 2018 15:54:39 -0700 Subject: [PATCH 27/55] timfuz: cleanup README Signed-off-by: John McMaster --- timfuz/README.md | 288 +++++++++++++++++++++++++++++++++++++++++++++ timfuz/README.txt | 71 ----------- timfuz/checksub.py | 1 + 3 files changed, 289 insertions(+), 71 deletions(-) create mode 100644 timfuz/README.md delete mode 100644 timfuz/README.txt diff --git a/timfuz/README.md b/timfuz/README.md new file mode 100644 index 00000000..ae90a689 --- /dev/null +++ b/timfuz/README.md @@ -0,0 +1,288 @@ +# Timing analysis fuzzer (timfuz) + +WIP: 2018-09-10: this process is just coming together and is going to get significant cleanup. But here's the general idea. + +This runs various designs through Vivado and processes the +resulting timing information in order to create very simple timing models. +While Vivado might have more involved models (say RC delays, fanout, etc), +timfuz creates simple models that bound realistic min and max element delays. + +Currently this document focuses exclusively on fabric timing delays.
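+ +For intuition, the core constraint problem can be sketched in a few lines of Python. This is a toy example only: t0 and t1 are hypothetical delay elements, and the real flow described under Methodology adds substitutions, deduplication and a least squares pass first: + +``` +import numpy as np +from scipy.optimize import linprog + +# One row per observed timing path, one column per delay element. +# Encodes (for a max corner): t0 >= 10 and t0 + t1 >= 100. +A = np.array([[1, 0], + [1, 1]]) +b = np.array([10, 100]) + +# linprog minimizes c @ x subject to A_ub @ x <= b_ub, +# so negate A and b to express the >= constraints. +res = linprog(c=np.ones(2), A_ub=-A, b_ub=-b, bounds=(0, None)) + +# Both [10, 90] and [100, 0] minimize the total delay; which one comes +# back is solver dependent (see "What didn't work" below). +print(res.x) +```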
+ + +## Quick start + +TODO: make this into a more formal makefile flow + +``` +# Pre-processing +# Create speed.json +./speed.sh + +# Create csvs +make N=1 +csv=specimen_001/timing3.csv + +# Main workflow +# Discover which variables can be separated +python3 timfuz_rref.py --simplify --out sub.json $csv +# Verify sub.json makes a solvable solution +python3 checksub.py --sub-json sub.json group.csv +# Separate variables +python3 csv_flat2group.py --sub-json sub.json --strict $csv group.csv +# Create a rough timing model that approximately fits the given paths +python3 solve_leastsq.py --sub-json sub.json group.csv --out leastsq.csv +# Tweak rough timing model, making sure all constraints are satisfied +python3 solve_linprog.py --sub-json sub.json --sub-csv leastsq.csv --massage group.csv --out linprog.csv +# Take separated variables and back-annotate them to the original timing variables +python3 csv_group2flat.py --sub-json sub.json --sort linprog.csv flat.csv + +# Final processing +# Create tile.json (where timing models are in tile fabric) +python3 tile_txt2json.py timgrid/specimen_001/tiles.txt tiles.json +# Insert timing delays into actual tile layouts +python3 tile_annotate.py flat.csv tilea.json +``` + + +## Vivado background + +Examples are for an XC750T on Vivado 2017.2. + +TODO maybe move to: https://github.com/SymbiFlow/prjxray/wiki/Timing + + +### Speed index + +Vivado seems to associate each delay model with a "speed index". +The fabric has these in two elements: wires (ie one delay element per tile) and pips. +For example, LUT output node A (ex: CLBLL_L_X12Y100/CLBLL_LL_A) has a single wire, also called CLBLL_L_X12Y100/CLBLL_LL_A. +This has speed index 733. Speed models can be queried and we find this corresponds to model C_CLBLL_LL_A +(a lookup sketch is given at the end of this background section). + +There are various speed model types: +* bel_delay +* buffer +* buffer_switch +* content_version +* functional +* inpin +* outpin +* parameters +* pass_transistor +* switch +* table_lookup +* tl_buffer +* vt_limits +* wire + +IIRC the interconnect is only composed of switch and wire types. + +Indices with value 65535 (0xFFFF) never appear on fabric wires or pips; presumably these mark unused models. +This value is used for some special models such as those of type "content_version". +For example, the "xilinx" model is of type "content_version". + +There are also "cost codes", but these seem to be very coarse (only around 30 of these) +and are suspected to be related more to PnR than to the timing model. + + +### Timing paths + +The Vivado timing analyzer can easily output the following: +* Full: delay from BEL pin to BEL pin +* Interconnect only (ICO): delay from BEL pin to BEL pin, but only report interconnect delays (ie exclude site delays) + +There is also theoretically an option to report delays up to a specific pip, +but this option is poorly documented and I was unable to get it to work. + +Each timing path reports a fast process and a slow process min and max value. So four process values are reported in total: +* fast_max +* fast_min +* slow_max +* slow_min + +For example, if the device is end of life, was poorly made, and at an extreme temperature, the delay may be up to the slow_max value. +Since ICO can be reported for each of these, fully analyzing a timing path results in 8 values. + +Finally, part of this was analyzing tile regularity to discover what a reasonably compact timing model was. +We verified that all tiles of the same type have exactly the same delay elements.
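+ +As a concrete sketch of working with speed indexes, the following mirrors load_speed_json from tile_txt2json.py; the speed.json path and the 733 => C_CLBLL_LL_A example come from this project, the rest is illustrative: + +``` +import json + +SI_NONE = 0xFFFF # marks models without a usable speed index + +# speed.json as produced by speed.sh +with open('build_speed/speed.json') as f: + j = json.load(f) + +# invert the table: speed index -> speed model name +speed_i2s = {v['speed_index']: k + for k, v in j['speed_model'].items() + if v['speed_index'] != SI_NONE} + +print(speed_i2s[733]) # expect C_CLBLL_LL_A per the example above +```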
+ + +## Methodology + +Make sure you've read the Vivado background section first. + + +### Background + +This section briefly describes some of the mathematics used by this technique that readers may not be familiar with. +These definitions are intended to be good enough to provide a high level understanding and may not be precise. + +Numerical analysis: the study of algorithms that use numerical approximation (as opposed to general symbolic manipulations) + +numpy: a popular numerical analysis python library. Often written np (import numpy as np). + +scipy: provides higher level functionality on top of numpy + +sympy ("symbolic python"): like numpy, but is designed to work with rational numbers. +For example, python actually stores 0.1 as 0.1000000000000000055511151231257827021181583404541015625. +However, sympy can represent this as the fraction 1/10, eliminating numerical approximation issues. + +Least squares (ex: scipy.optimize.least_squares): approximation method to do a best fit of several variables to a set of equations. +For example, given the equations "x = 1" and "x = 2" there isn't an exact solution. +However, "x = 1.5" is a good compromise since it reasonably solves both equations. + +Linear programming (ex: scipy.optimize.linprog aka linprog): approximation method that finds a set of variables that satisfy a set of inequalities. +For example, given "t0 >= 10" and "t0 + t1 >= 100", it can find values such as "t0 = 10" and "t1 = 90" that satisfy both, subject to an objective function. + +Reduced row echelon form (RREF, ex: sympy.Matrix.rref): the simplest form that a system of linear equations can be solved to. +For example, given "x = 1" and "x + y = 9", one can solve for "x = 1" and "y = 8". +However, given "x + y = 1" and "x + y + z = 9", there aren't enough equations to solve this fully. +In this case RREF provides a best effort by giving the ratios between correlated variables. +One variable is normalized to 1 in each of these ratios and is called the "pivot". +Note that if numpy.linalg.solve encounters an unsolvable matrix it may either complain +or generate a false solution due to numerical approximation issues. + + +### What didn't work + +First some quick background on things that didn't work to illustrate why the current approach was chosen. +I first tried to directly throw things into linprog, but it unfairly weighted towards arbitrary shared variables. For example, feeding in: +* t0 >= 10 +* t0 + t1 >= 100 + +It would declare "t0 = 100", "t1 = 0" instead of the more intuitive "t0 = 10", "t1 = 90". +I tried to work around this in several ways, notably subtracting equations from each other to produce additional constraints. +This worked okay, but was relatively slow and wasn't approaching nearly solved solutions, even when throwing a lot of data at it. + +Next we tried randomly combining a bunch of the equations together and solving them like a regular linear algebra matrix (numpy.linalg.solve). +However, this illustrated that the system was under-constrained. +Further analysis revealed that there are some delay element combinations that simply can't be linearly separated. +This was checked primarily using numpy.linalg.matrix_rank, with some use of numpy.linalg.slogdet. +matrix_rank was preferred over slogdet since it's more flexible against non-square matrices. + + +### Process + +The above ultimately led to the idea that we should come up with a set of substitutions that would make the system solvable.
This has several advantages: +* Easy to evaluate which variables aren't covered well enough by source data +* Easy to evaluate which variables weren't solved properly (if it's fully constrained it should have had a non-zero delay) + +At a high level, the above learnings gave this process: +* Find correlated variables by using RREF (sympy.Matrix.rref) to create variable groups + - Note pivots + - You must input a fractional type (ex: fractions.Fraction, but surprisingly not int) to get exact results, otherwise it seems to fall back to numerical approximation + - This is by far the most computationally expensive step + - Mixing RREF substitutions from one data set to another may not be recommended +* Use RREF result to substitute groups on input data, creating new meta variables, but ultimately reducing the number of columns +* Pick a corner + - Examples assume fast_max, but other corners are applicable with appropriate column and sign changes +* De-duplicate by removing equations that are less constrained + - Ex: if solving for a max corner and given: + - t0 + t1 >= 10 + - t0 + t1 >= 12 + - The first equation is redundant since the second provides a stricter constraint + - This significantly reduces computational time +* Use least squares (scipy.optimize.least_squares) to fit variables near input constraints + - Helps fairly weight delays vs the original input constraints + - Does not guarantee all constraints are met. For example, if this was put in (ignoring that these would have been de-duplicated): + - t0 = 10 + - t0 = 12 + - It may decide something like t0 = 11, which means that the second constraint was not satisfied given we actually want t0 >= 12 +* Use linear programming (scipy.optimize.linprog aka linprog) to formally meet all remaining constraints + - Start by filtering out all constraints that are already met. This should eliminate nearly all equations +* Map resulting constraints onto different tile types + - Group delays map onto the group pivot variable, typically setting other elements to 0 (if the processed set is not the one used to create the pivots they may be non-zero) + + +## TODO + +Milestone 1 (MVP) +* DONE +* Provide any process corner with at least some of the fabric + +Milestone 2 +* Provide all four fabric corners +* Simple makefile based flow +* Cleanup/separate fabric input targets + +Milestone 3 +* Create site delay model + +Final +* Investigate ZERO +* Investigate virtual switchboxes +* Compare our vs Xilinx output on random designs + + +### Improve test cases + +Test cases are somewhat random right now. We could make much more targeted cases using custom routing to improve various fanout estimates and such. +Also there are a lot more elements that are not covered. +At a minimum these should be moved to their own directory. + + +### ZERO models + +Background: there are a number of speed models with the name ZERO in them. +These generally seem to be zero delay, although this needs more investigation. + +Example: see virtual switchbox item below + +The timing models will probably significantly improve if these are removed. +In the past I was removing them, but decided to keep them in for now in the spirit of being more conservative.
+ +They include: + * _BSW_CLK_ZERO + * BSW_CLK_ZERO + * _BSW_ZERO + * BSW_ZERO + * _B_ZERO + * B_ZERO + * C_CLK_ZERO + * C_DSP_ZERO + * C_ZERO + * I_ZERO + * _O_ZERO + * O_ZERO + * RC_ZERO + * _R_ZERO + * R_ZERO + + +### Virtual switchboxes + +Background: several low level configuration details are abstracted with virtual configurable elements. +For example, LUT inputs can be rearranged to reduce routing congestion. +However, the LUT configuration must be changed to match the switched inputs. +This is handled by the CLBLL_L_INTER switchbox, which doesn't encode any physical configuration bits. +However, this contains PIPs with delay models. + +For example, LUT A input A1 has node CLBLM_M_A1; its pip junction CLBLM_M_A1 has PIP CLBLM_IMUX7->CLBLM_M_A1 +with speed index 659 (R_ZERO). + +This might be further evidence, on a related issue, that ZERO models should probably be removed. + + +### Incorporate fanout + +We could probably significantly improve model granularity by studying the impact of fanout on delay. + + +### Investigate RC delays + +Suspect accuracy could be significantly improved by moving to SPICE based models. But this will take significantly more characterization. + + +### Characterize real hardware + +A few people have expressed interest in running tests on real hardware. Will take some thought given we don't have direct access. + + +### Review approximation errors + +Ex: one known issue is that the objective function linearly weights small and large delays. +This is only recommended when variables are approximately the same order of magnitude. +For example, carry chain delays are on the order of 7 ps while other delays are 100 ps. +It's very easy to put a large delay on the carry chain while it could have been more appropriately put somewhere else. + diff --git a/timfuz/README.txt b/timfuz/README.txt deleted file mode 100644 index 5d37ec78..00000000 --- a/timfuz/README.txt +++ /dev/null @@ -1,71 +0,0 @@ -Timing analysis fuzzer -This runs some random designs through Vivado and extracts timing information in order to derive timing models -While Vivado has more involved RC (spice?) models incorporating fanout and other things, -for now we are shooting for simple, conservative models with a min and max timing delay - - -******************************************************************************* -Background -******************************************************************************* - -Vivado seems to associate each delay model with a "speed index" -In particular, we are currently looking at pips and wires, each of which have a speed index associated with them -For every timeing path, we record the total delay from one site to another, excluding site delays -(timing analyzer provides an option to make this easy) -We then walk along the path and record all wires and pips in between -These are converted to their associated speed indexes -This gives an equation that a series of speed indexes was given a certain delay value -These equations are then fed into scipy.optimize.linprog to give estimates for the delay models - -However, there are some complications.
For example: -Given a system of equations like: -t0 = 5 -t0 + t1 = 10 -t0 + t1 + t2 = 12 -The solver puts all the delays in t0 -To get around this, we subtract equations from each other - -Some additional info here: https://github.com/SymbiFlow/prjxray/wiki/Timing - - -******************************************************************************* -Quick start -******************************************************************************* - -./speed.sh -python timfuz_delay.py --cols-max 9 timfuz_dat/s1_timing2.txt -Which will report something like -Delay on 36 / 162 - -Now add some more data in: -python timfuz_delay.py --cols-max 9 timfuz_dat/speed_json.json timfuz_dat/s*_timing2.txt -Which should get a few more delay elements, say: -Delay on 57 / 185 - - -******************************************************************************* -From scratch -******************************************************************************* - -Roughly something like this -Edit generate.tcl -Uncomment speed_models2 -Run "make N=1" -python speed_json.py specimen_001/speed_model.txt speed_json.json -Edit generate.tcl -Comment speed_models2 -Run "make N=4" to generate some more timing data -Now run as in the quick start -python timfuz_delay.py --cols-max 9 speed_json.json specimen_*/timing2.txt - - -******************************************************************************* -TODO: -******************************************************************************* - -Verify elements are being imported correctly throughout the whole chain -Can any wires or similar be aggregated? - Ex: if a node consisents of two wire delay models and that pair is never seen elsewhere -Look at virtual switchboxes. Can these be removed? -Look at suspicous elements like WIRE_RC_ZERO - diff --git a/timfuz/checksub.py b/timfuz/checksub.py index f91fb38e..213fcb33 100644 --- a/timfuz/checksub.py +++ b/timfuz/checksub.py @@ -90,6 +90,7 @@ def run(fns_in, sub_json=None, verbose=False): print # https://docs.scipy.org/doc/numpy-dev/reference/generated/numpy.linalg.matrix_rank.html print('rank: %s / %d col' % (np.linalg.matrix_rank(Amat), len(names))) + # doesn't work on non-square matrices if 0: # https://docs.scipy.org/doc/numpy-1.14.0/reference/generated/numpy.linalg.slogdet.html sign, logdet = np.linalg.slogdet(Amat) From 5d8d0b22d8fdb14f762eaeb2116e36b13d7187a7 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Mon, 10 Sep 2018 15:57:13 -0700 Subject: [PATCH 28/55] timfuz: moving to fuzzers dir Signed-off-by: John McMaster --- {timfuz => fuzzers/007-timing}/.gitignore | 0 {timfuz => fuzzers/007-timing}/Makefile | 0 {timfuz => fuzzers/007-timing}/README.md | 0 {timfuz => fuzzers/007-timing}/benchmark.py | 0 {timfuz => fuzzers/007-timing}/checksub.py | 0 {timfuz => fuzzers/007-timing}/corner_csv.py | 0 {timfuz => fuzzers/007-timing}/csv_flat2group.py | 0 {timfuz => fuzzers/007-timing}/csv_group2flat.py | 0 {timfuz => fuzzers/007-timing}/generate.sh | 0 {timfuz => fuzzers/007-timing}/generate.tcl | 0 {timfuz => fuzzers/007-timing}/node_unique.py | 0 {timfuz => fuzzers/007-timing}/oneblinkw.v | 0 {timfuz => fuzzers/007-timing}/perf_test.py | 0 {timfuz => fuzzers/007-timing}/picorv32.v | 0 {timfuz => fuzzers/007-timing}/pip_unique.py | 0 {timfuz => fuzzers/007-timing}/placelut.py | 0 {timfuz => fuzzers/007-timing}/placelut_fb.py | 0 {timfuz => fuzzers/007-timing}/placelut_ff_fb.py | 0 {timfuz => fuzzers/007-timing}/rref.py | 0 {timfuz => fuzzers/007-timing}/solve_leastsq.py | 0 {timfuz => fuzzers/007-timing}/solve_linprog.py | 0 
{timfuz => fuzzers/007-timing}/speed.sh | 0 {timfuz => fuzzers/007-timing}/speed.tcl | 0 {timfuz => fuzzers/007-timing}/speed_json.py | 0 {timfuz => fuzzers/007-timing}/sub2csv.py | 0 {timfuz => fuzzers/007-timing}/tile_annotate.py | 0 {timfuz => fuzzers/007-timing}/tile_txt2json.py | 0 {timfuz => fuzzers/007-timing}/timfuz.py | 0 {timfuz => fuzzers/007-timing}/timfuz_csv.py | 0 {timfuz => fuzzers/007-timing}/timfuz_massage.py | 0 {timfuz => fuzzers/007-timing}/timfuz_solve.py | 0 {timfuz => fuzzers/007-timing}/timgrid/Makefile | 0 {timfuz => fuzzers/007-timing}/timgrid/generate.sh | 0 {timfuz => fuzzers/007-timing}/timgrid/generate.tcl | 0 {timfuz => fuzzers/007-timing}/timgrid/top.v | 0 {timfuz => fuzzers/007-timing}/timgrid/top_bram.v | 0 {timfuz => fuzzers/007-timing}/top.v | 0 {timfuz => fuzzers/007-timing}/wire_unique.py | 0 38 files changed, 0 insertions(+), 0 deletions(-) rename {timfuz => fuzzers/007-timing}/.gitignore (100%) rename {timfuz => fuzzers/007-timing}/Makefile (100%) rename {timfuz => fuzzers/007-timing}/README.md (100%) rename {timfuz => fuzzers/007-timing}/benchmark.py (100%) rename {timfuz => fuzzers/007-timing}/checksub.py (100%) rename {timfuz => fuzzers/007-timing}/corner_csv.py (100%) rename {timfuz => fuzzers/007-timing}/csv_flat2group.py (100%) rename {timfuz => fuzzers/007-timing}/csv_group2flat.py (100%) rename {timfuz => fuzzers/007-timing}/generate.sh (100%) rename {timfuz => fuzzers/007-timing}/generate.tcl (100%) rename {timfuz => fuzzers/007-timing}/node_unique.py (100%) rename {timfuz => fuzzers/007-timing}/oneblinkw.v (100%) rename {timfuz => fuzzers/007-timing}/perf_test.py (100%) rename {timfuz => fuzzers/007-timing}/picorv32.v (100%) rename {timfuz => fuzzers/007-timing}/pip_unique.py (100%) rename {timfuz => fuzzers/007-timing}/placelut.py (100%) rename {timfuz => fuzzers/007-timing}/placelut_fb.py (100%) rename {timfuz => fuzzers/007-timing}/placelut_ff_fb.py (100%) rename {timfuz => fuzzers/007-timing}/rref.py (100%) rename {timfuz => fuzzers/007-timing}/solve_leastsq.py (100%) rename {timfuz => fuzzers/007-timing}/solve_linprog.py (100%) rename {timfuz => fuzzers/007-timing}/speed.sh (100%) rename {timfuz => fuzzers/007-timing}/speed.tcl (100%) rename {timfuz => fuzzers/007-timing}/speed_json.py (100%) rename {timfuz => fuzzers/007-timing}/sub2csv.py (100%) rename {timfuz => fuzzers/007-timing}/tile_annotate.py (100%) rename {timfuz => fuzzers/007-timing}/tile_txt2json.py (100%) rename {timfuz => fuzzers/007-timing}/timfuz.py (100%) rename {timfuz => fuzzers/007-timing}/timfuz_csv.py (100%) rename {timfuz => fuzzers/007-timing}/timfuz_massage.py (100%) rename {timfuz => fuzzers/007-timing}/timfuz_solve.py (100%) rename {timfuz => fuzzers/007-timing}/timgrid/Makefile (100%) rename {timfuz => fuzzers/007-timing}/timgrid/generate.sh (100%) rename {timfuz => fuzzers/007-timing}/timgrid/generate.tcl (100%) rename {timfuz => fuzzers/007-timing}/timgrid/top.v (100%) rename {timfuz => fuzzers/007-timing}/timgrid/top_bram.v (100%) rename {timfuz => fuzzers/007-timing}/top.v (100%) rename {timfuz => fuzzers/007-timing}/wire_unique.py (100%) diff --git a/timfuz/.gitignore b/fuzzers/007-timing/.gitignore similarity index 100% rename from timfuz/.gitignore rename to fuzzers/007-timing/.gitignore diff --git a/timfuz/Makefile b/fuzzers/007-timing/Makefile similarity index 100% rename from timfuz/Makefile rename to fuzzers/007-timing/Makefile diff --git a/timfuz/README.md b/fuzzers/007-timing/README.md similarity index 100% rename from timfuz/README.md rename 
to fuzzers/007-timing/README.md diff --git a/timfuz/benchmark.py b/fuzzers/007-timing/benchmark.py similarity index 100% rename from timfuz/benchmark.py rename to fuzzers/007-timing/benchmark.py diff --git a/timfuz/checksub.py b/fuzzers/007-timing/checksub.py similarity index 100% rename from timfuz/checksub.py rename to fuzzers/007-timing/checksub.py diff --git a/timfuz/corner_csv.py b/fuzzers/007-timing/corner_csv.py similarity index 100% rename from timfuz/corner_csv.py rename to fuzzers/007-timing/corner_csv.py diff --git a/timfuz/csv_flat2group.py b/fuzzers/007-timing/csv_flat2group.py similarity index 100% rename from timfuz/csv_flat2group.py rename to fuzzers/007-timing/csv_flat2group.py diff --git a/timfuz/csv_group2flat.py b/fuzzers/007-timing/csv_group2flat.py similarity index 100% rename from timfuz/csv_group2flat.py rename to fuzzers/007-timing/csv_group2flat.py diff --git a/timfuz/generate.sh b/fuzzers/007-timing/generate.sh similarity index 100% rename from timfuz/generate.sh rename to fuzzers/007-timing/generate.sh diff --git a/timfuz/generate.tcl b/fuzzers/007-timing/generate.tcl similarity index 100% rename from timfuz/generate.tcl rename to fuzzers/007-timing/generate.tcl diff --git a/timfuz/node_unique.py b/fuzzers/007-timing/node_unique.py similarity index 100% rename from timfuz/node_unique.py rename to fuzzers/007-timing/node_unique.py diff --git a/timfuz/oneblinkw.v b/fuzzers/007-timing/oneblinkw.v similarity index 100% rename from timfuz/oneblinkw.v rename to fuzzers/007-timing/oneblinkw.v diff --git a/timfuz/perf_test.py b/fuzzers/007-timing/perf_test.py similarity index 100% rename from timfuz/perf_test.py rename to fuzzers/007-timing/perf_test.py diff --git a/timfuz/picorv32.v b/fuzzers/007-timing/picorv32.v similarity index 100% rename from timfuz/picorv32.v rename to fuzzers/007-timing/picorv32.v diff --git a/timfuz/pip_unique.py b/fuzzers/007-timing/pip_unique.py similarity index 100% rename from timfuz/pip_unique.py rename to fuzzers/007-timing/pip_unique.py diff --git a/timfuz/placelut.py b/fuzzers/007-timing/placelut.py similarity index 100% rename from timfuz/placelut.py rename to fuzzers/007-timing/placelut.py diff --git a/timfuz/placelut_fb.py b/fuzzers/007-timing/placelut_fb.py similarity index 100% rename from timfuz/placelut_fb.py rename to fuzzers/007-timing/placelut_fb.py diff --git a/timfuz/placelut_ff_fb.py b/fuzzers/007-timing/placelut_ff_fb.py similarity index 100% rename from timfuz/placelut_ff_fb.py rename to fuzzers/007-timing/placelut_ff_fb.py diff --git a/timfuz/rref.py b/fuzzers/007-timing/rref.py similarity index 100% rename from timfuz/rref.py rename to fuzzers/007-timing/rref.py diff --git a/timfuz/solve_leastsq.py b/fuzzers/007-timing/solve_leastsq.py similarity index 100% rename from timfuz/solve_leastsq.py rename to fuzzers/007-timing/solve_leastsq.py diff --git a/timfuz/solve_linprog.py b/fuzzers/007-timing/solve_linprog.py similarity index 100% rename from timfuz/solve_linprog.py rename to fuzzers/007-timing/solve_linprog.py diff --git a/timfuz/speed.sh b/fuzzers/007-timing/speed.sh similarity index 100% rename from timfuz/speed.sh rename to fuzzers/007-timing/speed.sh diff --git a/timfuz/speed.tcl b/fuzzers/007-timing/speed.tcl similarity index 100% rename from timfuz/speed.tcl rename to fuzzers/007-timing/speed.tcl diff --git a/timfuz/speed_json.py b/fuzzers/007-timing/speed_json.py similarity index 100% rename from timfuz/speed_json.py rename to fuzzers/007-timing/speed_json.py diff --git a/timfuz/sub2csv.py 
b/fuzzers/007-timing/sub2csv.py similarity index 100% rename from timfuz/sub2csv.py rename to fuzzers/007-timing/sub2csv.py diff --git a/timfuz/tile_annotate.py b/fuzzers/007-timing/tile_annotate.py similarity index 100% rename from timfuz/tile_annotate.py rename to fuzzers/007-timing/tile_annotate.py diff --git a/timfuz/tile_txt2json.py b/fuzzers/007-timing/tile_txt2json.py similarity index 100% rename from timfuz/tile_txt2json.py rename to fuzzers/007-timing/tile_txt2json.py diff --git a/timfuz/timfuz.py b/fuzzers/007-timing/timfuz.py similarity index 100% rename from timfuz/timfuz.py rename to fuzzers/007-timing/timfuz.py diff --git a/timfuz/timfuz_csv.py b/fuzzers/007-timing/timfuz_csv.py similarity index 100% rename from timfuz/timfuz_csv.py rename to fuzzers/007-timing/timfuz_csv.py diff --git a/timfuz/timfuz_massage.py b/fuzzers/007-timing/timfuz_massage.py similarity index 100% rename from timfuz/timfuz_massage.py rename to fuzzers/007-timing/timfuz_massage.py diff --git a/timfuz/timfuz_solve.py b/fuzzers/007-timing/timfuz_solve.py similarity index 100% rename from timfuz/timfuz_solve.py rename to fuzzers/007-timing/timfuz_solve.py diff --git a/timfuz/timgrid/Makefile b/fuzzers/007-timing/timgrid/Makefile similarity index 100% rename from timfuz/timgrid/Makefile rename to fuzzers/007-timing/timgrid/Makefile diff --git a/timfuz/timgrid/generate.sh b/fuzzers/007-timing/timgrid/generate.sh similarity index 100% rename from timfuz/timgrid/generate.sh rename to fuzzers/007-timing/timgrid/generate.sh diff --git a/timfuz/timgrid/generate.tcl b/fuzzers/007-timing/timgrid/generate.tcl similarity index 100% rename from timfuz/timgrid/generate.tcl rename to fuzzers/007-timing/timgrid/generate.tcl diff --git a/timfuz/timgrid/top.v b/fuzzers/007-timing/timgrid/top.v similarity index 100% rename from timfuz/timgrid/top.v rename to fuzzers/007-timing/timgrid/top.v diff --git a/timfuz/timgrid/top_bram.v b/fuzzers/007-timing/timgrid/top_bram.v similarity index 100% rename from timfuz/timgrid/top_bram.v rename to fuzzers/007-timing/timgrid/top_bram.v diff --git a/timfuz/top.v b/fuzzers/007-timing/top.v similarity index 100% rename from timfuz/top.v rename to fuzzers/007-timing/top.v diff --git a/timfuz/wire_unique.py b/fuzzers/007-timing/wire_unique.py similarity index 100% rename from timfuz/wire_unique.py rename to fuzzers/007-timing/wire_unique.py From 943ab5bbb7d1ea1ab6ea4a7d6f98f0522dd4c32c Mon Sep 17 00:00:00 2001 From: John McMaster Date: Tue, 11 Sep 2018 11:51:11 -0700 Subject: [PATCH 29/55] timfuz: placelut as standalone data generator Signed-off-by: John McMaster --- fuzzers/007-timing/Makefile | 22 -- fuzzers/007-timing/generate.sh | 9 - fuzzers/007-timing/generate.tcl | 279 ------------------ .../{ => projects/oneblinkw}/oneblinkw.v | 0 .../007-timing/{ => projects/picorv32}/top.v | 0 fuzzers/007-timing/projects/placelut/Makefile | 52 ++++ .../placelut/generate.py} | 2 +- .../007-timing/projects/placelut/generate.sh | 11 + .../007-timing/projects/placelut/generate.tcl | 47 +++ .../{ => projects/placelut_fb}/placelut_fb.py | 0 .../placelut_ff_fb}/placelut_ff_fb.py | 0 fuzzers/007-timing/speed.sh | 8 - fuzzers/007-timing/speed/.gitignore | 2 + fuzzers/007-timing/speed/Makefile | 12 + fuzzers/007-timing/speed/README.md | 4 + .../{speed.tcl => speed/generate.tcl} | 19 +- fuzzers/007-timing/{ => speed}/speed_json.py | 0 fuzzers/007-timing/speed/top.v | 8 + fuzzers/007-timing/{ => src}/picorv32.v | 0 fuzzers/007-timing/timgrid/.gitignore | 1 + fuzzers/007-timing/timgrid/Makefile | 28 +- 
fuzzers/007-timing/timgrid/generate.tcl | 6 +- .../007-timing/{ => timgrid}/tile_txt2json.py | 2 +- .../{timfuz_csv.py => timing_txt2csv.py} | 2 +- 24 files changed, 155 insertions(+), 359 deletions(-) delete mode 100644 fuzzers/007-timing/Makefile delete mode 100755 fuzzers/007-timing/generate.sh delete mode 100644 fuzzers/007-timing/generate.tcl rename fuzzers/007-timing/{ => projects/oneblinkw}/oneblinkw.v (100%) rename fuzzers/007-timing/{ => projects/picorv32}/top.v (100%) create mode 100644 fuzzers/007-timing/projects/placelut/Makefile rename fuzzers/007-timing/{placelut.py => projects/placelut/generate.py} (98%) create mode 100755 fuzzers/007-timing/projects/placelut/generate.sh create mode 100644 fuzzers/007-timing/projects/placelut/generate.tcl rename fuzzers/007-timing/{ => projects/placelut_fb}/placelut_fb.py (100%) rename fuzzers/007-timing/{ => projects/placelut_ff_fb}/placelut_ff_fb.py (100%) delete mode 100755 fuzzers/007-timing/speed.sh create mode 100644 fuzzers/007-timing/speed/.gitignore create mode 100644 fuzzers/007-timing/speed/Makefile create mode 100644 fuzzers/007-timing/speed/README.md rename fuzzers/007-timing/{speed.tcl => speed/generate.tcl} (90%) rename fuzzers/007-timing/{ => speed}/speed_json.py (100%) create mode 100644 fuzzers/007-timing/speed/top.v rename fuzzers/007-timing/{ => src}/picorv32.v (100%) create mode 100644 fuzzers/007-timing/timgrid/.gitignore rename fuzzers/007-timing/{ => timgrid}/tile_txt2json.py (96%) rename fuzzers/007-timing/{timfuz_csv.py => timing_txt2csv.py} (99%) diff --git a/fuzzers/007-timing/Makefile b/fuzzers/007-timing/Makefile deleted file mode 100644 index 8da96c3f..00000000 --- a/fuzzers/007-timing/Makefile +++ /dev/null @@ -1,22 +0,0 @@ -N := 1 -SPECIMENS := $(addprefix specimen_,$(shell seq -f '%03.0f' $(N))) -SPECIMENS_OK := $(addsuffix /OK,$(SPECIMENS)) - -all: $(SPECIMENS_OK) - #python timfuz.py specimen_*/timing.txt - -$(SPECIMENS_OK): - bash generate.sh $(subst /OK,,$@) - touch $@ - -run: - $(MAKE) clean - $(MAKE) all - touch run.ok - -clean: - rm -rf specimen_[0-9][0-9][0-9]/ seg_clblx.segbits __pycache__ run.ok - rm -rf vivado*.log vivado_*.str vivado*.jou design *.bits *.dcp *.bit - -.PHONY: database pushdb run clean - diff --git a/fuzzers/007-timing/generate.sh b/fuzzers/007-timing/generate.sh deleted file mode 100755 index eebd0388..00000000 --- a/fuzzers/007-timing/generate.sh +++ /dev/null @@ -1,9 +0,0 @@ -#!/bin/bash - -set -ex - -source ${XRAY_GENHEADER} - -python ../placelut_ff_fb.py --sdx 4 --sdy 4 >placelut.v -vivado -mode batch -source ../generate.tcl - diff --git a/fuzzers/007-timing/generate.tcl b/fuzzers/007-timing/generate.tcl deleted file mode 100644 index a2e76c71..00000000 --- a/fuzzers/007-timing/generate.tcl +++ /dev/null @@ -1,279 +0,0 @@ -source ../../../utils/utils.tcl - -proc pin_info {pin} { - set cell [get_cells -of_objects $pin] - set bel [get_bels -of_objects $cell] - set site [get_sites -of_objects $bel] - return "$site $bel" -} - -proc pin_bel {pin} { - set cell [get_cells -of_objects $pin] - set bel [get_bels -of_objects $cell] - return $bel -} - -proc build_design {} { - create_project -force -part $::env(XRAY_PART) design design - #read_verilog ../top.v - #read_verilog ../picorv32.v - #read_verilog ../oneblinkw.v - read_verilog placelut.v - synth_design -top top - - puts "Locking pins" - set_property LOCK_PINS {I0:A1 I1:A2 I2:A3 I3:A4 I4:A5 I5:A6} \ - [get_cells -quiet -filter {REF_NAME == LUT6} -hierarchical] - - puts "Package stuff" - set_property -dict "PACKAGE_PIN 
$::env(XRAY_PIN_00) IOSTANDARD LVCMOS33" [get_ports clk] - set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_01) IOSTANDARD LVCMOS33" [get_ports stb] - set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_02) IOSTANDARD LVCMOS33" [get_ports di] - set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_03) IOSTANDARD LVCMOS33" [get_ports do] - - if {0 < 0} { - puts "pblocking" - create_pblock roi - set roipb [get_pblocks roi] - set_property EXCLUDE_PLACEMENT 1 $roipb - add_cells_to_pblock $roipb [get_cells roi] - resize_pblock $roipb -add "$::env(XRAY_ROI)" - - puts "randplace" - randplace_pblock 150 $roipb - } - - set_property CFGBVS VCCO [current_design] - set_property CONFIG_VOLTAGE 3.3 [current_design] - set_property BITSTREAM.GENERAL.PERFRAMECRC YES [current_design] - - puts "dedicated route" - set_property CLOCK_DEDICATED_ROUTE FALSE [get_nets clk_IBUF] - - place_design - - - route_design - - write_checkpoint -force design.dcp - # disable combinitorial loop - # set_property IS_ENABLED 0 [get_drc_checks {LUTLP-1}] - #write_bitstream -force design.bit -} - -# Changed to group wires and nodes -# This allows tracing the full path along with pips -proc write_info3 {} { - set outdir "." - set fp [open "$outdir/timing3.txt" w] - # bel as site/bel, so don't bother with site - puts $fp "net src_bel dst_bel ico fast_max fast_min slow_max slow_min pips inodes wires" - - set TIME_start [clock clicks -milliseconds] - set verbose 0 - set equations 0 - set site_src_nets 0 - set site_dst_nets 0 - set neti 0 - set nets [get_nets -hierarchical] - set nnets [llength $nets] - foreach net $nets { - incr neti - #if {$neti >= 10} { - # puts "Debug break" - # break - #} - - puts "Net $neti / $nnets: $net" - # The semantics of get_pins -leaf is kind of odd - # When no passthrough LUTs exist, it has no effect - # When passthrough LUT present: - # -w/o -leaf: some pins + passthrough LUT pins - # -w/ -leaf: different pins + passthrough LUT pins - # With OUT filter this seems to be sufficient - set src_pin [get_pins -leaf -filter {DIRECTION == OUT} -of_objects $net] - set src_bel [pin_bel $src_pin] - set src_site [get_sites -of_objects $src_bel] - # Only one net driver - set src_site_pins [get_site_pins -filter {DIRECTION == OUT} -of_objects $net] - - # Sometimes this is empty for reasons that escape me - # Emitting direction doesn't help - if {[llength $src_site_pins] < 1} { - if $verbose { - puts " Ignoring site internal net" - } - incr site_src_nets - continue - } - set dst_site_pins_net [get_site_pins -filter {DIRECTION == IN} -of_objects $net] - if {[llength $dst_site_pins_net] < 1} { - puts " Skipping site internal source net" - incr site_dst_nets - continue - } - foreach src_site_pin $src_site_pins { - if $verbose { - puts "Source: $src_pin at site $src_site:$src_bel, spin $src_site_pin" - } - - # Run with and without interconnect only - foreach ico "0 1" { - set ico_flag "" - if $ico { - set ico_flag "-interconnect_only" - set delays [get_net_delays $ico_flag -of_objects $net] - } else { - set delays [get_net_delays -of_objects $net] - } - foreach delay $delays { - set delaystr [get_property NAME $delay] - set dst_pins [get_property TO_PIN $delay] - set dst_pin [get_pins $dst_pins] - #puts " $delaystr: $src_pin => $dst_pin" - set dst_bel [pin_bel $dst_pin] - set dst_site [get_sites -of_objects $dst_bel] - if $verbose { - puts " Dest: $dst_pin at site $dst_site:$dst_bel" - } - - set dst_site_pins [get_site_pins -of_objects $dst_pin] - # Some nets are internal - # But should this happen on dest if we've already filtered 
source? - if {"$dst_site_pins" eq ""} { - continue - } - # Also apparantly you can have multiple of these as well - foreach dst_site_pin $dst_site_pins { - set fast_max [get_property "FAST_MAX" $delay] - set fast_min [get_property "FAST_MIN" $delay] - set slow_max [get_property "SLOW_MAX" $delay] - set slow_min [get_property "SLOW_MIN" $delay] - - # Want: - # Site / BEL at src - # Site / BEL at dst - # Pips in between - # Walk net, looking for interesting elements in between - set pips [get_pips -of_objects $net -from $src_site_pin -to $dst_site_pin] - if $verbose { - foreach pip $pips { - puts " PIP $pip" - } - } - set nodes [get_nodes -of_objects $net -from $src_site_pin -to $dst_site_pin] - #set wires [get_wires -of_objects $net -from $src_site_pin -to $dst_site_pin] - set wires [get_wires -of_objects $nodes] - - # puts $fp "$net $src_bel $dst_bel $ico $fast_max $fast_min $slow_max $slow_min $pips" - puts -nonewline $fp "$net $src_bel $dst_bel $ico $fast_max $fast_min $slow_max $slow_min" - - # Write pips w/ speed index - puts -nonewline $fp " " - set needspace 0 - foreach pip $pips { - if $needspace { - puts -nonewline $fp "|" - } - set speed_index [get_property SPEED_INDEX $pip] - puts -nonewline $fp "$pip:$speed_index" - set needspace 1 - } - - # Write nodes - #set nodes_str [string map {" " "|"} $nodes] - #puts -nonewline $fp " $nodes_str" - puts -nonewline $fp " " - set needspace 0 - foreach node $nodes { - if $needspace { - puts -nonewline $fp "|" - } - set nwires [llength [get_wires -of_objects $node]] - puts -nonewline $fp "$node:$nwires" - set needspace 1 - } - - # Write wires - puts -nonewline $fp " " - set needspace 0 - foreach wire $wires { - if $needspace { - puts -nonewline $fp "|" - } - set speed_index [get_property SPEED_INDEX $wire] - puts -nonewline $fp "$wire:$speed_index" - set needspace 1 - } - - puts $fp "" - - incr equations - break - } - } - } - } - } - close $fp - set TIME_taken [expr [clock clicks -milliseconds] - $TIME_start] - puts "Took ms: $TIME_taken" - puts "Generated $equations equations" - puts "Skipped $site_src_nets (+ $site_dst_nets) site nets" -} - -proc pips_all {} { - set outdir "." - set fp [open "$outdir/pip_all.txt" w] - set items [get_pips] - puts "Items: [llength $items]" - - set needspace 0 - set properties [list_property [lindex $items 0]] - foreach item $items { - set needspace 0 - foreach property $properties { - set val [get_property $property $item] - if {"$val" ne ""} { - if $needspace { - puts -nonewline $fp " " - } - puts -nonewline $fp "$property:$val" - set needspace 1 - } - } - puts $fp "" - } - close $fp -} -proc wires_all {} { - set outdir "." 
- set fp [open "$outdir/wire_all.txt" w] - set items [get_wires] - puts "Items: [llength $items]" - - set needspace 0 - set properties [list_property [lindex $items 0]] - foreach item $items { - set needspace 0 - foreach property $properties { - set val [get_property $property $item] - if {"$val" ne ""} { - if $needspace { - puts -nonewline $fp " " - } - puts -nonewline $fp "$property:$val" - set needspace 1 - } - } - puts $fp "" - } - close $fp -} - -build_design -#write_info2 -write_info3 -#wires_all -#pips_all - diff --git a/fuzzers/007-timing/oneblinkw.v b/fuzzers/007-timing/projects/oneblinkw/oneblinkw.v similarity index 100% rename from fuzzers/007-timing/oneblinkw.v rename to fuzzers/007-timing/projects/oneblinkw/oneblinkw.v diff --git a/fuzzers/007-timing/top.v b/fuzzers/007-timing/projects/picorv32/top.v similarity index 100% rename from fuzzers/007-timing/top.v rename to fuzzers/007-timing/projects/picorv32/top.v diff --git a/fuzzers/007-timing/projects/placelut/Makefile b/fuzzers/007-timing/projects/placelut/Makefile new file mode 100644 index 00000000..df00e979 --- /dev/null +++ b/fuzzers/007-timing/projects/placelut/Makefile @@ -0,0 +1,52 @@ +N := 1 +SPECIMENS := $(addprefix specimen_,$(shell seq -f '%03.0f' $(N))) +SPECIMENS_OK := $(addsuffix /OK,$(SPECIMENS)) +CSVS := $(addsuffix /timing3.csv,$(SPECIMENS)) +TIMFUZ_DIR=$(XRAY_DIR)/fuzzers/007-timing + +all: tilea.json + +$(SPECIMENS_OK): + bash generate.sh $(subst /OK,,$@) + touch $@ + +run: + $(MAKE) clean + $(MAKE) all + touch run.ok + +clean: + rm -rf specimen_[0-9][0-9][0-9]/ seg_clblx.segbits __pycache__ run.ok + rm -rf vivado*.log vivado_*.str vivado*.jou design *.bits *.dcp *.bit + rm -rf build + +.PHONY: database pushdb run clean + +sub.json: $(SPECIMENS_OK) + # Discover which variables can be separated + # This is typically the longest running operation + python3 $(TIMFUZ_DIR)/rref.py --simplify --out sub.json $(CSVS) + +grouped.csv: $(SPECIMENS_OK) sub.json + # Separate variables + python3 $(TIMFUZ_DIR)/csv_flat2group.py --sub-json sub.json --strict $(CSVS) grouped.csv + # Verify sub.json makes a solvable solution + # python3 $(TIMFUZ_DIR)/checksub.py --sub-json sub.json grouped.csv + +leastsq.csv: sub.json grouped.csv + # Create a rough timing model that approximately fits the given paths + python3 $(TIMFUZ_DIR)/solve_leastsq.py --sub-json sub.json grouped.csv --out leastsq.csv + +linprog.csv: leastsq.csv grouped.csv + # Tweak rough timing model, making sure all constraints are satisfied + python3 $(TIMFUZ_DIR)/solve_linprog.py --sub-json sub.json --sub-csv leastsq.csv --massage grouped.csv --out linprog.csv + +flat.csv: linprog.csv + # Take separated variables and back-annotate them to the original timing variables + python3 $(TIMFUZ_DIR)/csv_group2flat.py --sub-json sub.json --sort linprog.csv flat.csv + +tilea.json: flat.csv + # Final processing + # Insert timing delays into actual tile layouts + python3 $(TIMFUZ_DIR)/tile_annotate.py --tile-json $(TIMFUZ_DIR)/timgrid/build/timgrid.json flat.csv tilea.json + diff --git a/fuzzers/007-timing/placelut.py b/fuzzers/007-timing/projects/placelut/generate.py similarity index 98% rename from fuzzers/007-timing/placelut.py rename to fuzzers/007-timing/projects/placelut/generate.py index 47dd9e3c..a56d4c55 100644 --- a/fuzzers/007-timing/placelut.py +++ b/fuzzers/007-timing/projects/placelut/generate.py @@ -25,7 +25,7 @@ nlut = 4 * SDX * SDY nin = 6 * nlut nout = nlut -print('placelut simple') +print('//placelut simple') print('//SBASE: %s' % (SBASE,)) print('//SDX: %s' % 
(SDX,)) print('//SDY: %s' % (SDY,)) diff --git a/fuzzers/007-timing/projects/placelut/generate.sh b/fuzzers/007-timing/projects/placelut/generate.sh new file mode 100755 index 00000000..fff71d31 --- /dev/null +++ b/fuzzers/007-timing/projects/placelut/generate.sh @@ -0,0 +1,11 @@ +#!/bin/bash + +set -ex + +source ${XRAY_GENHEADER} +TIMFUZ_DIR=$XRAY_DIR/fuzzers/007-timing + +python ../generate.py --sdx 4 --sdy 4 >top.v +vivado -mode batch -source ../generate.tcl +python3 $TIMFUZ_DIR/timing_txt2csv.py --speed-json $TIMFUZ_DIR/speed/build/speed.json --out timing3.csv timing3.txt + diff --git a/fuzzers/007-timing/projects/placelut/generate.tcl b/fuzzers/007-timing/projects/placelut/generate.tcl new file mode 100644 index 00000000..0b536169 --- /dev/null +++ b/fuzzers/007-timing/projects/placelut/generate.tcl @@ -0,0 +1,47 @@ +source ../../../../../utils/utils.tcl +source ../../project.tcl + +proc build_design {} { + create_project -force -part $::env(XRAY_PART) design design + read_verilog top.v + synth_design -top top + + puts "Locking pins" + set_property LOCK_PINS {I0:A1 I1:A2 I2:A3 I3:A4 I4:A5 I5:A6} \ + [get_cells -quiet -filter {REF_NAME == LUT6} -hierarchical] + + puts "Package stuff" + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_00) IOSTANDARD LVCMOS33" [get_ports clk] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_01) IOSTANDARD LVCMOS33" [get_ports stb] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_02) IOSTANDARD LVCMOS33" [get_ports di] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_03) IOSTANDARD LVCMOS33" [get_ports do] + + puts "pblocking" + create_pblock roi + set roipb [get_pblocks roi] + set_property EXCLUDE_PLACEMENT 1 $roipb + add_cells_to_pblock $roipb [get_cells roi] + resize_pblock $roipb -add "$::env(XRAY_ROI)" + + puts "randplace" + randplace_pblock 50 roi + + set_property CFGBVS VCCO [current_design] + set_property CONFIG_VOLTAGE 3.3 [current_design] + set_property BITSTREAM.GENERAL.PERFRAMECRC YES [current_design] + + puts "dedicated route" + set_property CLOCK_DEDICATED_ROUTE FALSE [get_nets clk_IBUF] + + place_design + route_design + + write_checkpoint -force design.dcp + # disable combinatorial loop DRC + # set_property IS_ENABLED 0 [get_drc_checks {LUTLP-1}] + #write_bitstream -force design.bit +} + +build_design +write_info3 + diff --git a/fuzzers/007-timing/placelut_fb.py b/fuzzers/007-timing/projects/placelut_fb/placelut_fb.py similarity index 100% rename from fuzzers/007-timing/placelut_fb.py rename to fuzzers/007-timing/projects/placelut_fb/placelut_fb.py diff --git a/fuzzers/007-timing/placelut_ff_fb.py b/fuzzers/007-timing/projects/placelut_ff_fb/placelut_ff_fb.py similarity index 100% rename from fuzzers/007-timing/placelut_ff_fb.py rename to fuzzers/007-timing/projects/placelut_ff_fb/placelut_ff_fb.py diff --git a/fuzzers/007-timing/speed.sh b/fuzzers/007-timing/speed.sh deleted file mode 100755 index 0712c64f..00000000 --- a/fuzzers/007-timing/speed.sh +++ /dev/null @@ -1,8 +0,0 @@ -#!/usr/bin/env bash -set -ex - -mkdir -p build_speed -cd build_speed -vivado -mode batch -source ../speed.tcl -python ../speed_json.py speed_model.txt node.txt speed.json - diff --git a/fuzzers/007-timing/speed/.gitignore b/fuzzers/007-timing/speed/.gitignore new file mode 100644 index 00000000..9ef96044 --- /dev/null +++ b/fuzzers/007-timing/speed/.gitignore @@ -0,0 +1,2 @@ +build + diff --git a/fuzzers/007-timing/speed/Makefile b/fuzzers/007-timing/speed/Makefile new file mode 100644 index 00000000..e2b7a520 --- /dev/null +++ b/fuzzers/007-timing/speed/Makefile @@
-0,0 +1,12 @@ +all: build/speed.json + +build/node.txt: speed_json.py generate.tcl + mkdir -p build + cd build && vivado -mode batch -source ../generate.tcl + +build/speed.json: build/node.txt + cd build && python ../speed_json.py speed_model.txt node.txt speed.json + +clean: + rm -rf build + diff --git a/fuzzers/007-timing/speed/README.md b/fuzzers/007-timing/speed/README.md new file mode 100644 index 00000000..a10f335d --- /dev/null +++ b/fuzzers/007-timing/speed/README.md @@ -0,0 +1,4 @@ +Generates speed.json, describing speed index to string translation. +These indices appear to be fixed between runtimes. +It is unknown how stable they are across versions. + diff --git a/fuzzers/007-timing/speed.tcl b/fuzzers/007-timing/speed/generate.tcl similarity index 90% rename from fuzzers/007-timing/speed.tcl rename to fuzzers/007-timing/speed/generate.tcl index 31f8b857..cf423e65 100644 --- a/fuzzers/007-timing/speed.tcl +++ b/fuzzers/007-timing/speed/generate.tcl @@ -1,5 +1,3 @@ -source ../../../utils/utils.tcl - proc pin_info {pin} { set cell [get_cells -of_objects $pin] set bel [get_bels -of_objects $cell] @@ -16,24 +14,17 @@ proc pin_bel {pin} { proc build_design_full {} { create_project -force -part $::env(XRAY_PART) design design read_verilog ../top.v - read_verilog ../picorv32.v + read_verilog ../../src/picorv32.v synth_design -top top - set_property LOCK_PINS {I0:A1 I1:A2 I2:A3 I3:A4 I4:A5 I5:A6} \ - [get_cells -quiet -filter {REF_NAME == LUT6} -hierarchical] + #set_property LOCK_PINS {I0:A1 I1:A2 I2:A3 I3:A4 I4:A5 I5:A6} \ + # [get_cells -quiet -filter {REF_NAME == LUT6} -hierarchical] set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_00) IOSTANDARD LVCMOS33" [get_ports clk] set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_01) IOSTANDARD LVCMOS33" [get_ports stb] set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_02) IOSTANDARD LVCMOS33" [get_ports di] set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_03) IOSTANDARD LVCMOS33" [get_ports do] - create_pblock roi - set roipb [get_pblocks roi] - set_property EXCLUDE_PLACEMENT 1 $roipb - add_cells_to_pblock $roipb [get_cells roi] - resize_pblock $roipb -add "$::env(XRAY_ROI)" - - randplace_pblock 150 $roipb set_property CFGBVS VCCO [current_design] set_property CONFIG_VOLTAGE 3.3 [current_design] set_property BITSTREAM.GENERAL.PERFRAMECRC YES [current_design] @@ -145,7 +136,7 @@ proc nodes_unique_cc {} { set outdir "." 
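    # (editorial note, not part of the original patch) nodes_unique_cc dumps one
    # representative node per unique COST_CODE; per the speed/Makefile above,
    # speed_json.py then combines node.txt with speed_model.txt into speed.json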
set fp [open "$outdir/node.txt" w] set items [get_nodes] - puts "Items: [llength $items]" + puts "Computing cost codes with [llength $items] items" set needspace 0 set properties [list_property [lindex $items 0]] @@ -157,7 +148,7 @@ proc nodes_unique_cc {} { if {[ dict exists $cost_codes_known $cost_code ]} { continue } - puts "Adding $cost_code @ item $itemi" + puts " Adding cost code $cost_code @ item $itemi" dict set cost_codes_known $cost_code 1 set needspace 0 diff --git a/fuzzers/007-timing/speed_json.py b/fuzzers/007-timing/speed/speed_json.py similarity index 100% rename from fuzzers/007-timing/speed_json.py rename to fuzzers/007-timing/speed/speed_json.py diff --git a/fuzzers/007-timing/speed/top.v b/fuzzers/007-timing/speed/top.v new file mode 100644 index 00000000..cf662548 --- /dev/null +++ b/fuzzers/007-timing/speed/top.v @@ -0,0 +1,8 @@ +module top(input clk, stb, di, output do); + reg dor; + always @(posedge clk) begin + dor <= stb & di; + end + assign do = dor; +endmodule + diff --git a/fuzzers/007-timing/picorv32.v b/fuzzers/007-timing/src/picorv32.v similarity index 100% rename from fuzzers/007-timing/picorv32.v rename to fuzzers/007-timing/src/picorv32.v diff --git a/fuzzers/007-timing/timgrid/.gitignore b/fuzzers/007-timing/timgrid/.gitignore new file mode 100644 index 00000000..378eac25 --- /dev/null +++ b/fuzzers/007-timing/timgrid/.gitignore @@ -0,0 +1 @@ +build diff --git a/fuzzers/007-timing/timgrid/Makefile b/fuzzers/007-timing/timgrid/Makefile index c59f83bf..af0a72da 100644 --- a/fuzzers/007-timing/timgrid/Makefile +++ b/fuzzers/007-timing/timgrid/Makefile @@ -1,26 +1,12 @@ +all: build/timgrid.json -N := 1 -SPECIMENS := $(addprefix specimen_,$(shell seq -f '%03.0f' $(N))) -SPECIMENS_OK := $(addsuffix /OK,$(SPECIMENS)) +build/timgrid.txt: generate.tcl + mkdir -p build + cd build && vivado -mode batch -source ../generate.tcl -database: $(SPECIMENS_OK) - cp specimen_001/tilegrid.json tilegrid.json - -pushdb: - cp tilegrid.json ${XRAY_DATABASE_DIR}/$(XRAY_DATABASE)/tilegrid.json - -$(SPECIMENS_OK): - bash generate.sh $(subst /OK,,$@) - touch $@ - -run: - $(MAKE) clean - $(MAKE) database - $(MAKE) pushdb - touch run.ok +build/timgrid.json: build/timgrid.txt + cd build && python3 ../tile_txt2json.py --speed-json ../../speed/build/speed.json timgrid.txt timgrid.json clean: - rm -rf specimen_[0-9][0-9][0-9]/ tilegrid.json run.ok - -.PHONY: database pushdb clean run + rm -rf build diff --git a/fuzzers/007-timing/timgrid/generate.tcl b/fuzzers/007-timing/timgrid/generate.tcl index 70a9b030..c7f218bc 100644 --- a/fuzzers/007-timing/timgrid/generate.tcl +++ b/fuzzers/007-timing/timgrid/generate.tcl @@ -1,4 +1,4 @@ -proc create_project {} { +proc build_project {} { if 0 { set grid_min_x -1 set grid_max_x -1 @@ -83,7 +83,7 @@ proc write_data {} { set tiles [get_tiles -filter "GRID_POINT_X >= $grid_min_x && GRID_POINT_X <= $grid_max_x && GRID_POINT_Y >= $grid_min_y && GRID_POINT_Y <= $grid_max_y"] # Write tiles.txt with site metadata - set fp [open "tiles.txt" w] + set fp [open "timgrid.txt" w] foreach tile $tiles { set type [get_property TYPE $tile] set grid_x [get_property GRID_POINT_X $tile] @@ -114,6 +114,6 @@ proc write_data {} { close $fp } -create_project +build_project write_data diff --git a/fuzzers/007-timing/tile_txt2json.py b/fuzzers/007-timing/timgrid/tile_txt2json.py similarity index 96% rename from fuzzers/007-timing/tile_txt2json.py rename to fuzzers/007-timing/timgrid/tile_txt2json.py index 06711f87..b6e410ff 100644 --- a/fuzzers/007-timing/tile_txt2json.py 
+++ b/fuzzers/007-timing/timgrid/tile_txt2json.py @@ -62,7 +62,7 @@ def main(): description= 'Solve timing solution' ) - parser.add_argument('--speed-json', default='build_speed/speed.json', + parser.add_argument('--speed-json', default='../../speed/build/speed.json', help='Provides speed index to name translation') parser.add_argument('fnin', default=None, help='input tcl output .txt') parser.add_argument('fnout', default=None, help='output .json') diff --git a/fuzzers/007-timing/timfuz_csv.py b/fuzzers/007-timing/timing_txt2csv.py similarity index 99% rename from fuzzers/007-timing/timfuz_csv.py rename to fuzzers/007-timing/timing_txt2csv.py index 97da40e1..51f04f42 100644 --- a/fuzzers/007-timing/timfuz_csv.py +++ b/fuzzers/007-timing/timing_txt2csv.py @@ -1,6 +1,6 @@ #!/usr/bin/env python3 -from timfuz import Benchmark, row_di2ds, A_di2ds +from timfuz import Benchmark, A_di2ds import numpy as np import glob import math From 133ff586e80055aa5391d2ddd6f1b1373eed7fe7 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Tue, 11 Sep 2018 12:02:32 -0700 Subject: [PATCH 30/55] timfuz: move project outputs to build directory Signed-off-by: John McMaster --- fuzzers/007-timing/projects/placelut/Makefile | 29 ++++++++++--------- 1 file changed, 15 insertions(+), 14 deletions(-) diff --git a/fuzzers/007-timing/projects/placelut/Makefile b/fuzzers/007-timing/projects/placelut/Makefile index df00e979..f1e10dc2 100644 --- a/fuzzers/007-timing/projects/placelut/Makefile +++ b/fuzzers/007-timing/projects/placelut/Makefile @@ -4,7 +4,7 @@ SPECIMENS_OK := $(addsuffix /OK,$(SPECIMENS)) CSVS := $(addsuffix /timing3.csv,$(SPECIMENS)) TIMFUZ_DIR=$(XRAY_DIR)/fuzzers/007-timing -all: tilea.json +all: build/tilea.json $(SPECIMENS_OK): bash generate.sh $(subst /OK,,$@) @@ -22,31 +22,32 @@ clean: .PHONY: database pushdb run clean -sub.json: $(SPECIMENS_OK) +build/sub.json: $(SPECIMENS_OK) + mkdir -p build # Discover which variables can be separated # This is typically the longest running operation - python3 $(TIMFUZ_DIR)/rref.py --simplify --out sub.json $(CSVS) + python3 $(TIMFUZ_DIR)/rref.py --simplify --out build/sub.json $(CSVS) -grouped.csv: $(SPECIMENS_OK) sub.json +build/grouped.csv: $(SPECIMENS_OK) build/sub.json # Separate variables - python3 $(TIMFUZ_DIR)/csv_flat2group.py --sub-json sub.json --strict $(CSVS) grouped.csv + python3 $(TIMFUZ_DIR)/csv_flat2group.py --sub-json build/sub.json --strict $(CSVS) build/grouped.csv # Verify sub.json makes a solvable solution - # python3 $(TIMFUZ_DIR)/checksub.py --sub-json sub.json grouped.csv + # python3 $(TIMFUZ_DIR)/checksub.py --sub-json build/sub.json grouped.csv -leastsq.csv: sub.json grouped.csv +build/leastsq.csv: build/sub.json build/grouped.csv # Create a rough timing model that approximately fits the given paths - python3 $(TIMFUZ_DIR)/solve_leastsq.py --sub-json sub.json grouped.csv --out leastsq.csv + python3 $(TIMFUZ_DIR)/solve_leastsq.py --sub-json build/sub.json build/grouped.csv --out build/leastsq.csv -linprog.csv: leastsq.csv grouped.csv +build/linprog.csv: build/leastsq.csv build/grouped.csv # Tweak rough timing model, making sure all constraints are satisfied - python3 $(TIMFUZ_DIR)/solve_linprog.py --sub-json sub.json --sub-csv leastsq.csv --massage grouped.csv --out linprog.csv + python3 $(TIMFUZ_DIR)/solve_linprog.py --sub-json build/sub.json --sub-csv build/leastsq.csv --massage build/grouped.csv --out build/linprog.csv -flat.csv: linprog.csv +build/flat.csv: build/linprog.csv # Take separated variables and back-annotate them to the 
original timing variables - python3 $(TIMFUZ_DIR)/csv_group2flat.py --sub-json sub.json --sort linprog.csv flat.csv + python3 $(TIMFUZ_DIR)/csv_group2flat.py --sub-json build/sub.json --sort build/linprog.csv build/flat.csv -tilea.json: flat.csv +build/tilea.json: build/flat.csv # Final processing # Insert timing delays into actual tile layouts - python3 $(TIMFUZ_DIR)/tile_annotate.py --tile-json $(TIMFUZ_DIR)/timgrid/build/timgrid.json flat.csv tilea.json + python3 $(TIMFUZ_DIR)/tile_annotate.py --tile-json $(TIMFUZ_DIR)/timgrid/build/timgrid.json build/flat.csv build/tilea.json From 557fda4215fa50701a506c30d01ee210002ba979 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Tue, 11 Sep 2018 12:07:41 -0700 Subject: [PATCH 31/55] timfuz: placelut made into generic project Signed-off-by: John McMaster --- fuzzers/007-timing/projects/placelut/Makefile | 53 +----- fuzzers/007-timing/projects/project.mk | 53 ++++++ fuzzers/007-timing/projects/project.tcl | 174 ++++++++++++++++++ 3 files changed, 228 insertions(+), 52 deletions(-) create mode 100644 fuzzers/007-timing/projects/project.mk create mode 100644 fuzzers/007-timing/projects/project.tcl diff --git a/fuzzers/007-timing/projects/placelut/Makefile b/fuzzers/007-timing/projects/placelut/Makefile index f1e10dc2..9c8b1947 100644 --- a/fuzzers/007-timing/projects/placelut/Makefile +++ b/fuzzers/007-timing/projects/placelut/Makefile @@ -1,53 +1,2 @@ -N := 1 -SPECIMENS := $(addprefix specimen_,$(shell seq -f '%03.0f' $(N))) -SPECIMENS_OK := $(addsuffix /OK,$(SPECIMENS)) -CSVS := $(addsuffix /timing3.csv,$(SPECIMENS)) -TIMFUZ_DIR=$(XRAY_DIR)/fuzzers/007-timing - -all: build/tilea.json - -$(SPECIMENS_OK): - bash generate.sh $(subst /OK,,$@) - touch $@ - -run: - $(MAKE) clean - $(MAKE) all - touch run.ok - -clean: - rm -rf specimen_[0-9][0-9][0-9]/ seg_clblx.segbits __pycache__ run.ok - rm -rf vivado*.log vivado_*.str vivado*.jou design *.bits *.dcp *.bit - rm -rf build - -.PHONY: database pushdb run clean - -build/sub.json: $(SPECIMENS_OK) - mkdir -p build - # Discover which variables can be separated - # This is typically the longest running operation - python3 $(TIMFUZ_DIR)/rref.py --simplify --out build/sub.json $(CSVS) - -build/grouped.csv: $(SPECIMENS_OK) build/sub.json - # Separate variables - python3 $(TIMFUZ_DIR)/csv_flat2group.py --sub-json build/sub.json --strict $(CSVS) build/grouped.csv - # Verify sub.json makes a solvable solution - # python3 $(TIMFUZ_DIR)/checksub.py --sub-json build/sub.json grouped.csv - -build/leastsq.csv: build/sub.json build/grouped.csv - # Create a rough timing model that approximately fits the given paths - python3 $(TIMFUZ_DIR)/solve_leastsq.py --sub-json build/sub.json build/grouped.csv --out build/leastsq.csv - -build/linprog.csv: build/leastsq.csv build/grouped.csv - # Tweak rough timing model, making sure all constraints are satisfied - python3 $(TIMFUZ_DIR)/solve_linprog.py --sub-json build/sub.json --sub-csv build/leastsq.csv --massage build/grouped.csv --out build/linprog.csv - -build/flat.csv: build/linprog.csv - # Take separated variables and back-annotate them to the original timing variables - python3 $(TIMFUZ_DIR)/csv_group2flat.py --sub-json build/sub.json --sort build/linprog.csv build/flat.csv - -build/tilea.json: build/flat.csv - # Final processing - # Insert timing delays into actual tile layouts - python3 $(TIMFUZ_DIR)/tile_annotate.py --tile-json $(TIMFUZ_DIR)/timgrid/build/timgrid.json build/flat.csv build/tilea.json +include ../project.mk diff --git 
a/fuzzers/007-timing/projects/project.mk b/fuzzers/007-timing/projects/project.mk new file mode 100644 index 00000000..f1e10dc2 --- /dev/null +++ b/fuzzers/007-timing/projects/project.mk @@ -0,0 +1,53 @@ +N := 1 +SPECIMENS := $(addprefix specimen_,$(shell seq -f '%03.0f' $(N))) +SPECIMENS_OK := $(addsuffix /OK,$(SPECIMENS)) +CSVS := $(addsuffix /timing3.csv,$(SPECIMENS)) +TIMFUZ_DIR=$(XRAY_DIR)/fuzzers/007-timing + +all: build/tilea.json + +$(SPECIMENS_OK): + bash generate.sh $(subst /OK,,$@) + touch $@ + +run: + $(MAKE) clean + $(MAKE) all + touch run.ok + +clean: + rm -rf specimen_[0-9][0-9][0-9]/ seg_clblx.segbits __pycache__ run.ok + rm -rf vivado*.log vivado_*.str vivado*.jou design *.bits *.dcp *.bit + rm -rf build + +.PHONY: database pushdb run clean + +build/sub.json: $(SPECIMENS_OK) + mkdir -p build + # Discover which variables can be separated + # This is typically the longest running operation + python3 $(TIMFUZ_DIR)/rref.py --simplify --out build/sub.json $(CSVS) + +build/grouped.csv: $(SPECIMENS_OK) build/sub.json + # Separate variables + python3 $(TIMFUZ_DIR)/csv_flat2group.py --sub-json build/sub.json --strict $(CSVS) build/grouped.csv + # Verify sub.json makes a solvable solution + # python3 $(TIMFUZ_DIR)/checksub.py --sub-json build/sub.json grouped.csv + +build/leastsq.csv: build/sub.json build/grouped.csv + # Create a rough timing model that approximately fits the given paths + python3 $(TIMFUZ_DIR)/solve_leastsq.py --sub-json build/sub.json build/grouped.csv --out build/leastsq.csv + +build/linprog.csv: build/leastsq.csv build/grouped.csv + # Tweak rough timing model, making sure all constraints are satisfied + python3 $(TIMFUZ_DIR)/solve_linprog.py --sub-json build/sub.json --sub-csv build/leastsq.csv --massage build/grouped.csv --out build/linprog.csv + +build/flat.csv: build/linprog.csv + # Take separated variables and back-annotate them to the original timing variables + python3 $(TIMFUZ_DIR)/csv_group2flat.py --sub-json build/sub.json --sort build/linprog.csv build/flat.csv + +build/tilea.json: build/flat.csv + # Final processing + # Insert timing delays into actual tile layouts + python3 $(TIMFUZ_DIR)/tile_annotate.py --tile-json $(TIMFUZ_DIR)/timgrid/build/timgrid.json build/flat.csv build/tilea.json + diff --git a/fuzzers/007-timing/projects/project.tcl b/fuzzers/007-timing/projects/project.tcl new file mode 100644 index 00000000..b1478201 --- /dev/null +++ b/fuzzers/007-timing/projects/project.tcl @@ -0,0 +1,174 @@ +proc pin_info {pin} { + set cell [get_cells -of_objects $pin] + set bel [get_bels -of_objects $cell] + set site [get_sites -of_objects $bel] + return "$site $bel" +} + +proc pin_bel {pin} { + set cell [get_cells -of_objects $pin] + set bel [get_bels -of_objects $cell] + return $bel +} + +# Changed to group wires and nodes +# This allows tracing the full path along with pips +proc write_info3 {} { + set outdir "." 
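+    # (editorial note, not part of the original patch) each line written below is
+    # one timing equation: the header fields, then |-separated pip:speed_index,
+    # node:wire_count and wire:speed_index tokens describing the routed path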
+ set fp [open "$outdir/timing3.txt" w] + # bel as site/bel, so don't bother with site + puts $fp "net src_bel dst_bel ico fast_max fast_min slow_max slow_min pips inodes wires" + + set TIME_start [clock clicks -milliseconds] + set verbose 0 + set equations 0 + set site_src_nets 0 + set site_dst_nets 0 + set neti 0 + set nets [get_nets -hierarchical] + set nnets [llength $nets] + foreach net $nets { + incr neti + #if {$neti >= 10} { + # puts "Debug break" + # break + #} + + puts "Net $neti / $nnets: $net" + # The semantics of get_pins -leaf is kind of odd + # When no passthrough LUTs exist, it has no effect + # When passthrough LUT present: + # -w/o -leaf: some pins + passthrough LUT pins + # -w/ -leaf: different pins + passthrough LUT pins + # With OUT filter this seems to be sufficient + set src_pin [get_pins -leaf -filter {DIRECTION == OUT} -of_objects $net] + set src_bel [pin_bel $src_pin] + set src_site [get_sites -of_objects $src_bel] + # Only one net driver + set src_site_pins [get_site_pins -filter {DIRECTION == OUT} -of_objects $net] + + # Sometimes this is empty for reasons that escape me + # Emitting direction doesn't help + if {[llength $src_site_pins] < 1} { + if $verbose { + puts " Ignoring site internal net" + } + incr site_src_nets + continue + } + set dst_site_pins_net [get_site_pins -filter {DIRECTION == IN} -of_objects $net] + if {[llength $dst_site_pins_net] < 1} { + puts " Skipping site internal source net" + incr site_dst_nets + continue + } + foreach src_site_pin $src_site_pins { + if $verbose { + puts "Source: $src_pin at site $src_site:$src_bel, spin $src_site_pin" + } + + # Run with and without interconnect only + foreach ico "0 1" { + set ico_flag "" + if $ico { + set ico_flag "-interconnect_only" + set delays [get_net_delays $ico_flag -of_objects $net] + } else { + set delays [get_net_delays -of_objects $net] + } + foreach delay $delays { + set delaystr [get_property NAME $delay] + set dst_pins [get_property TO_PIN $delay] + set dst_pin [get_pins $dst_pins] + #puts " $delaystr: $src_pin => $dst_pin" + set dst_bel [pin_bel $dst_pin] + set dst_site [get_sites -of_objects $dst_bel] + if $verbose { + puts " Dest: $dst_pin at site $dst_site:$dst_bel" + } + + set dst_site_pins [get_site_pins -of_objects $dst_pin] + # Some nets are internal + # But should this happen on dest if we've already filtered source? 
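+                    # (editorial note, not part of the original patch) an empty site
+                    # pin list means this destination never leaves the site, so there
+                    # is no interconnect path to record; skip it like the source case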
+ if {"$dst_site_pins" eq ""} { + continue + } + # Also apparently you can have multiple of these as well + foreach dst_site_pin $dst_site_pins { + set fast_max [get_property "FAST_MAX" $delay] + set fast_min [get_property "FAST_MIN" $delay] + set slow_max [get_property "SLOW_MAX" $delay] + set slow_min [get_property "SLOW_MIN" $delay] + + # Want: + # Site / BEL at src + # Site / BEL at dst + # Pips in between + # Walk net, looking for interesting elements in between + set pips [get_pips -of_objects $net -from $src_site_pin -to $dst_site_pin] + if $verbose { + foreach pip $pips { + puts " PIP $pip" + } + } + set nodes [get_nodes -of_objects $net -from $src_site_pin -to $dst_site_pin] + #set wires [get_wires -of_objects $net -from $src_site_pin -to $dst_site_pin] + set wires [get_wires -of_objects $nodes] + + # puts $fp "$net $src_bel $dst_bel $ico $fast_max $fast_min $slow_max $slow_min $pips" + puts -nonewline $fp "$net $src_bel $dst_bel $ico $fast_max $fast_min $slow_max $slow_min" + + # Write pips w/ speed index + puts -nonewline $fp " " + set needspace 0 + foreach pip $pips { + if $needspace { + puts -nonewline $fp "|" + } + set speed_index [get_property SPEED_INDEX $pip] + puts -nonewline $fp "$pip:$speed_index" + set needspace 1 + } + + # Write nodes + #set nodes_str [string map {" " "|"} $nodes] + #puts -nonewline $fp " $nodes_str" + puts -nonewline $fp " " + set needspace 0 + foreach node $nodes { + if $needspace { + puts -nonewline $fp "|" + } + set nwires [llength [get_wires -of_objects $node]] + puts -nonewline $fp "$node:$nwires" + set needspace 1 + } + + # Write wires + puts -nonewline $fp " " + set needspace 0 + foreach wire $wires { + if $needspace { + puts -nonewline $fp "|" + } + set speed_index [get_property SPEED_INDEX $wire] + puts -nonewline $fp "$wire:$speed_index" + set needspace 1 + } + + puts $fp "" + + incr equations + break + } + } + } + } + } + close $fp + set TIME_taken [expr [clock clicks -milliseconds] - $TIME_start] + puts "Took ms: $TIME_taken" + puts "Generated $equations equations" + puts "Skipped $site_src_nets (+ $site_dst_nets) site nets" +} + From c2707e5c23faf27be1aaad531049cf724d9409ad Mon Sep 17 00:00:00 2001 From: John McMaster Date: Tue, 11 Sep 2018 12:12:33 -0700 Subject: [PATCH 32/55] timfuz: simplify readme instructions using new make system Signed-off-by: John McMaster --- fuzzers/007-timing/README.md | 36 +++++++++--------------------------- 1 file changed, 9 insertions(+), 27 deletions(-) diff --git a/fuzzers/007-timing/README.md b/fuzzers/007-timing/README.md index ae90a689..047e073c 100644 --- a/fuzzers/007-timing/README.md +++ b/fuzzers/007-timing/README.md @@ -12,36 +12,18 @@ Currently this document focuses exclusively on fabric timing delays.
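(Editorial note, not part of the original patch.) The per-project flow depends on two shared artifacts: speed/build/speed.json, the speed index to name translation consumed by timing_txt2csv.py and tile_txt2json.py, and timgrid/build/timgrid.json, the tile layout that tile_annotate.py fills in. That is why the speed and timgrid directories are built before any project, as the quick start below does.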
## Quick start -TODO: make this into a more formal makefile flow - ``` -# Pre-processing -# Create speed.json -./speed.sh +pushd speed +make +popd -# Create csvs +pushd timgrid +make +popd + +pushd projects/placelut make N=1 -csv=specimen_001/timing3.csv - -# Main workflow -# Discover which variables can be separated -python3 timfuz_rref.py --simplify --out sub.json $csv -# Verify sub.json makes a solvable solution -python3 checksub.py --sub-json sub.json group.csv -# Separate variables -python3 csv_flat2group.py --sub-json sub.json --strict $csv group.csv -# Create a rough timing model that approximately fits the given paths -python3 solve_leastsq.py --sub-json sub.json group.csv --out leastsq.csv -# Tweak rough timing model, making sure all constraints are satisfied -python3 solve_linprog.py --sub-json sub.json --sub-csv leastsq.csv --massage group.csv --out linprog.csv -# Take separated variables and back-annotate them to the original timing variables -python3 csv_group2flat.py --sub-json sub.json --sort linprog.csv flat.csv - -# Final processing -# Create tile.json (where timing models are in tile fabric) -python3 tile_txt2json.py timgrid/specimen_001/tiles.txt tiles.json -# Insert timing delays into actual tile layouts -python3 tile_annotate.py flat.csv tilea.json +popd ``` From 1fc02389ed4c230aff9c9e4a5de877eb074cf509 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Tue, 11 Sep 2018 12:25:57 -0700 Subject: [PATCH 33/55] timfuz: tile_annotate report solve correctly Signed-off-by: John McMaster --- fuzzers/007-timing/tile_annotate.py | 21 +++++++++++++-------- fuzzers/007-timing/timfuz.py | 12 ++++++------ 2 files changed, 19 insertions(+), 14 deletions(-) diff --git a/fuzzers/007-timing/tile_annotate.py b/fuzzers/007-timing/tile_annotate.py index e294769b..005b6c52 100644 --- a/fuzzers/007-timing/tile_annotate.py +++ b/fuzzers/007-timing/tile_annotate.py @@ -1,5 +1,6 @@ #!/usr/bin/env python3 +import timfuz from timfuz import loadc_Ads_b, Ads2bounds import sys @@ -20,9 +21,9 @@ def run(fnin, fnout, tile_json_fn, verbose=False): bounds = Ads2bounds(Ads, b) pipn_net = 0 - pipn_solved = 0 + pipn_solved = [0, 0, 0, 0] wiren_net = 0 - wiren_solved = 0 + wiren_solved = [0, 0, 0, 0] for tile in tilej['tiles'].values(): pips = tile['pips'] @@ -30,19 +31,23 @@ def run(fnin, fnout, tile_json_fn, verbose=False): val = bounds.get('PIP_' + v, None) pips[k] = quad(val) pipn_net += 1 - if pips[k]: - pipn_solved += 1 + for i in range(4): + if pips[k][i]: + pipn_solved[i] += 1 wires = tile['wires'] for k, v in wires.items(): val = bounds.get('WIRE_' + v, None) wires[k] = quad(val) wiren_net += 1 - if wires[k]: - wiren_solved += 1 + for i in range(4): + if wires[k][i]: + wiren_solved[i] += 1 - print('Pips: %u / %u solved' % (pipn_solved, pipn_net)) - print('Wires: %u / %u solved' % (wiren_solved, wiren_net)) + for corner, corneri in timfuz.corner_s2i.items(): + print('Corner %s' % corner) + print(' Pips: %u / %u solved' % (pipn_solved[corneri], pipn_net)) + print(' Wires: %u / %u solved' % (wiren_solved[corneri], wiren_net)) json.dump(tilej, open(fnout, 'w'), sort_keys=True, indent=4, separators=(',', ': ')) diff --git a/fuzzers/007-timing/timfuz.py b/fuzzers/007-timing/timfuz.py index 6f2f8918..f48b7e89 100644 --- a/fuzzers/007-timing/timfuz.py +++ b/fuzzers/007-timing/timfuz.py @@ -30,12 +30,12 @@ NAME_ZERO = set([ ]) # csv index -corner_s2i = { - 'fast_max': 0, - 'fast_min': 1, - 'slow_max': 2, - 'slow_min': 3, - } +corner_s2i = OrderedDict([ + ('fast_max', 0), + ('fast_min', 1), + ('slow_max', 
2), + ('slow_min', 3), + ]) def print_eqns(A_ubd, b_ub, verbose=0, lim=3, label=''): rows = len(b_ub) From fa524df6575e4f3bba1adfaf0b3c4dcfb94e6117 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Tue, 11 Sep 2018 16:43:37 -0700 Subject: [PATCH 34/55] timfuz: fix zero delay element inconsistency Signed-off-by: John McMaster --- fuzzers/007-timing/checksub.py | 5 ++- fuzzers/007-timing/csv_flat2group.py | 39 +++++++------------ .../007-timing/projects/oneblinkw/oneblinkw.v | 37 ------------------ fuzzers/007-timing/projects/project.mk | 24 ++++++++---- fuzzers/007-timing/rref.py | 2 +- fuzzers/007-timing/timfuz.py | 19 ++++----- 6 files changed, 44 insertions(+), 82 deletions(-) delete mode 100644 fuzzers/007-timing/projects/oneblinkw/oneblinkw.v diff --git a/fuzzers/007-timing/checksub.py b/fuzzers/007-timing/checksub.py index 213fcb33..9cdb259d 100644 --- a/fuzzers/007-timing/checksub.py +++ b/fuzzers/007-timing/checksub.py @@ -89,7 +89,8 @@ def run(fns_in, sub_json=None, verbose=False): ''' print # https://docs.scipy.org/doc/numpy-dev/reference/generated/numpy.linalg.matrix_rank.html - print('rank: %s / %d col' % (np.linalg.matrix_rank(Amat), len(names))) + rank = np.linalg.matrix_rank(Amat) + print('rank: %s / %d col' % (rank, len(names))) # doesn't work on non-square matrices if 0: # https://docs.scipy.org/doc/numpy-1.14.0/reference/generated/numpy.linalg.slogdet.html @@ -99,6 +100,8 @@ def run(fns_in, sub_json=None, verbose=False): print('slogdet :( : 0') else: print('slogdet :) : %s, %s' % (sign, logdet)) + if rank != len(names): + raise Exception("Matrix not fully ranked w/ %u / %u" % (rank, len(names))) def main(): import argparse diff --git a/fuzzers/007-timing/csv_flat2group.py b/fuzzers/007-timing/csv_flat2group.py index 7a050585..57be54a5 100644 --- a/fuzzers/007-timing/csv_flat2group.py +++ b/fuzzers/007-timing/csv_flat2group.py @@ -1,19 +1,6 @@ #!/usr/bin/env python3 -# https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html -from scipy.optimize import linprog -from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json, A_ub_np2d, print_eqns, print_eqns_np, Ads2bounds, loadc_Ads_raw, instances -from timfuz_massage import massage_equations -import numpy as np -import glob -import json -import math -from collections import OrderedDict -from fractions import Fraction -import sys -import datetime -import os -import time +from timfuz import Benchmark, loadc_Ads_b, index_names, load_sub, run_sub_json, instances def gen_group(fnin, sub_json, strict=False, verbose=False): print('Loading data') @@ -31,15 +18,16 @@ def gen_group(fnin, sub_json, strict=False, verbose=False): for row_ds, row_b in zip(Ads, b): yield row_ds, [row_b for _ in range(4)] -def run(fnin, fnout, sub_json, corner=None, strict=False, verbose=False): +def run(fns_in, fnout, sub_json, corner=None, strict=False, verbose=False): with open(fnout, 'w') as fout: fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') - for row_ds, row_bs in gen_group(fnin, sub_json, strict=strict): - row_ico = 1 - items = [str(row_ico), ' '.join([str(x) for x in row_bs])] - for k, v in sorted(row_ds.items()): - items.append('%u %s' % (v, k)) - fout.write(','.join(items) + '\n') + for fn_in in fns_in: + for row_ds, row_bs in gen_group(fn_in, sub_json, strict=strict): + row_ico = 1 + items = [str(row_ico), ' '.join([str(x) for x in row_bs])] + for k, v in sorted(row_ds.items()): + items.append('%u %s' % (v, k)) + 
fout.write(','.join(items) + '\n') def main(): import argparse @@ -54,8 +42,11 @@ def main(): parser.add_argument('--strict', action='store_true', help='') parser.add_argument('--sub-csv', help='') parser.add_argument('--sub-json', required=True, help='Group substitutions to make fully ranked') - parser.add_argument('fnin', default=None, help='input timing delay .csv') - parser.add_argument('fnout', default=None, help='output timing delay .csv') + parser.add_argument('--out', help='Output sub.json substitution result') + parser.add_argument( + 'fns_in', + nargs='*', + help='timing3.txt input files') args = parser.parse_args() # Store options in dict to ease passing through functions bench = Benchmark() @@ -63,7 +54,7 @@ def main(): sub_json = load_sub(args.sub_json) try: - run(args.fnin, args.fnout, sub_json=sub_json, strict=args.strict, verbose=args.verbose) + run(args.fns_in, args.out, sub_json=sub_json, strict=args.strict, verbose=args.verbose) finally: print('Exiting after %s' % bench) diff --git a/fuzzers/007-timing/projects/oneblinkw/oneblinkw.v b/fuzzers/007-timing/projects/oneblinkw/oneblinkw.v deleted file mode 100644 index 5e133bac..00000000 --- a/fuzzers/007-timing/projects/oneblinkw/oneblinkw.v +++ /dev/null @@ -1,37 +0,0 @@ -module roi ( - input wire clk, - output wire out); - reg [23:0] counter; - assign out = counter[23] ^ counter[22] ^ counter[2] && counter[1] || counter[0]; - - always @(posedge clk) begin - counter <= counter + 1; - end -endmodule - -module top(input wire clk, input wire stb, input wire di, output wire do); - localparam integer DIN_N = 0; - localparam integer DOUT_N = 1; - - reg [DIN_N-1:0] din; - wire [DOUT_N-1:0] dout; - - reg [DIN_N-1:0] din_shr; - reg [DOUT_N-1:0] dout_shr; - - always @(posedge clk) begin - din_shr <= {din_shr, di}; - dout_shr <= {dout_shr, din_shr[DIN_N-1]}; - if (stb) begin - din <= din_shr; - dout_shr <= dout; - end - end - - assign do = dout_shr[DOUT_N-1]; - roi roi( - .clk(clk), - .out(dout[0]) - ); -endmodule - diff --git a/fuzzers/007-timing/projects/project.mk b/fuzzers/007-timing/projects/project.mk index f1e10dc2..f870af11 100644 --- a/fuzzers/007-timing/projects/project.mk +++ b/fuzzers/007-timing/projects/project.mk @@ -26,25 +26,33 @@ build/sub.json: $(SPECIMENS_OK) mkdir -p build # Discover which variables can be separated # This is typically the longest running operation - python3 $(TIMFUZ_DIR)/rref.py --simplify --out build/sub.json $(CSVS) + python3 $(TIMFUZ_DIR)/rref.py --simplify --out build/sub.json.tmp $(CSVS) + mv build/sub.json.tmp build/sub.json build/grouped.csv: $(SPECIMENS_OK) build/sub.json # Separate variables - python3 $(TIMFUZ_DIR)/csv_flat2group.py --sub-json build/sub.json --strict $(CSVS) build/grouped.csv - # Verify sub.json makes a solvable solution - # python3 $(TIMFUZ_DIR)/checksub.py --sub-json build/sub.json grouped.csv + python3 $(TIMFUZ_DIR)/csv_flat2group.py --sub-json build/sub.json --strict --out build/grouped.csv.tmp $(CSVS) + mv build/grouped.csv.tmp build/grouped.csv -build/leastsq.csv: build/sub.json build/grouped.csv +build/checksub: build/grouped.csv build/sub.json + # Verify sub.json makes a cleanly solvable solution with no non-pivot leftover + python3 $(TIMFUZ_DIR)/checksub.py --sub-json build/sub.json build/grouped.csv + touch build/checksub + +build/leastsq.csv: build/sub.json build/grouped.csv build/checksub # Create a rough timing model that approximately fits the given paths - python3 $(TIMFUZ_DIR)/solve_leastsq.py --sub-json build/sub.json build/grouped.csv --out 
build/leastsq.csv + python3 $(TIMFUZ_DIR)/solve_leastsq.py --sub-json build/sub.json build/grouped.csv --out build/leastsq.csv.tmp + mv build/leastsq.csv.tmp build/leastsq.csv build/linprog.csv: build/leastsq.csv build/grouped.csv # Tweak rough timing model, making sure all constraints are satisfied - python3 $(TIMFUZ_DIR)/solve_linprog.py --sub-json build/sub.json --sub-csv build/leastsq.csv --massage build/grouped.csv --out build/linprog.csv + python3 $(TIMFUZ_DIR)/solve_linprog.py --sub-json build/sub.json --sub-csv build/leastsq.csv --massage build/grouped.csv --out build/linprog.csv.tmp + mv build/linprog.csv.tmp build/linprog.csv build/flat.csv: build/linprog.csv # Take separated variables and back-annotate them to the original timing variables - python3 $(TIMFUZ_DIR)/csv_group2flat.py --sub-json build/sub.json --sort build/linprog.csv build/flat.csv + python3 $(TIMFUZ_DIR)/csv_group2flat.py --sub-json build/sub.json --sort build/linprog.csv build/flat.csv.tmp + mv build/flat.csv.tmp build/flat.csv build/tilea.json: build/flat.csv # Final processing diff --git a/fuzzers/007-timing/rref.py b/fuzzers/007-timing/rref.py index df0d7153..19dcc89c 100644 --- a/fuzzers/007-timing/rref.py +++ b/fuzzers/007-timing/rref.py @@ -71,7 +71,7 @@ class State(object): Ads, b = loadc_Ads_b(fn_ins, corner=corner, ico=True) if simplify: print('Simplifying corner %s' % (corner,)) - Ads, b = simplify_rows(Ads, b) + Ads, b = simplify_rows(Ads, b, remove_zd=False) return State(Ads) def write_state(state, fout): diff --git a/fuzzers/007-timing/timfuz.py b/fuzzers/007-timing/timfuz.py index f48b7e89..604649c9 100644 --- a/fuzzers/007-timing/timfuz.py +++ b/fuzzers/007-timing/timfuz.py @@ -130,7 +130,7 @@ def Ab_ub_dt2d(eqns): return list(A_ubd), list(b_ub) # This significantly reduces runtime -def simplify_rows(Ads, b_ub): +def simplify_rows(Ads, b_ub, remove_zd=False): '''Remove duplicate equations, taking highest delay''' # dict of constants to highest delay eqns = OrderedDict() @@ -149,7 +149,7 @@ def simplify_rows(Ads, b_ub): # TODO: elements have zero delay (ex: COUT) # Remove these from now since they make me nervous # Although they should just solve to 0 - if not b: + if remove_zd and not b: zero_ds += 1 continue @@ -168,7 +168,7 @@ def simplify_rows(Ads, b_ub): #A_ub_ret = eqns.keys() A_ubd_ret, b_ub_ret = Ab_ub_dt2d(eqns) - print('Simplify rows: %d => %d w/ zd %d, ze %d' % (len(b_ub), len(b_ub_ret), zero_ds, zero_es)) + print('Simplify rows: %d => %d rows w/ zd %d, ze %d' % (len(b_ub), len(b_ub_ret), zero_ds, zero_es)) #return A_ub_ret, b_ub_ret #return A_ub_np2d(A_ub_ret), b_ub_ret return A_ubd_ret, b_ub_ret @@ -693,9 +693,9 @@ def loadc_Ads_b(fns, corner, ico=None): corneri = corner_s2i[corner] if ico is not None: - filt = lambda ico, corners, vars: ico == ico + filt = lambda ico_, corners, vars: ico_ == ico else: - filt = lambda ico, corners, vars: True + filt = lambda ico_, corners, vars: True def mkb(val): return val[corneri] @@ -725,9 +725,6 @@ def load_sub(fn): return j def row_sub_syms(row, sub_json, strict=False, verbose=False): - zero = Fraction(0) - zero = 0 - if 0 and verbose: print("") print(row.items()) @@ -761,9 +758,9 @@ def row_sub_syms(row, sub_json, strict=False, verbose=False): if verbose: print('pivot %i %s' % (n, pivot)) for subk, subv in sorted(sub_json['subs'][group].items()): - oldn = row.get(subk, zero) + oldn = row.get(subk, type(subv)(0)) rown = -n * subv - rown += type(rown)(oldn) + rown += oldn if verbose: print(" %s: %d => %d" % (subk, oldn, rown)) if rown == 0: @@ 
-783,7 +780,7 @@ def row_sub_syms(row, sub_json, strict=False, verbose=False): # verify no subs are left for subs in sub_json['subs'].values(): for sub in subs: - assert sub not in row, 'Unexpected element %s' % sub + assert sub not in row, 'non-pivot element after group sub %s' % sub # Verify all constants are positive for k, v in sorted(row.items()): From 7ac4f31e589bc54f6f5b050d1c516cb24972eeba Mon Sep 17 00:00:00 2001 From: John McMaster Date: Tue, 11 Sep 2018 17:16:01 -0700 Subject: [PATCH 35/55] timfuz: zero row add assertion Signed-off-by: John McMaster --- fuzzers/007-timing/projects/.gitignore | 3 ++ fuzzers/007-timing/projects/generate.sh | 9 ++++ .../007-timing/projects/oneblinkw/Makefile | 2 + .../007-timing/projects/oneblinkw/generate.sh | 8 ++++ .../projects/oneblinkw/generate.tcl | 47 +++++++++++++++++++ fuzzers/007-timing/projects/oneblinkw/top.v | 37 +++++++++++++++ fuzzers/007-timing/timfuz.py | 6 +-- 7 files changed, 109 insertions(+), 3 deletions(-) create mode 100644 fuzzers/007-timing/projects/.gitignore create mode 100644 fuzzers/007-timing/projects/generate.sh create mode 100644 fuzzers/007-timing/projects/oneblinkw/Makefile create mode 100755 fuzzers/007-timing/projects/oneblinkw/generate.sh create mode 100644 fuzzers/007-timing/projects/oneblinkw/generate.tcl create mode 100644 fuzzers/007-timing/projects/oneblinkw/top.v diff --git a/fuzzers/007-timing/projects/.gitignore b/fuzzers/007-timing/projects/.gitignore new file mode 100644 index 00000000..374eddc2 --- /dev/null +++ b/fuzzers/007-timing/projects/.gitignore @@ -0,0 +1,3 @@ +specimen_* +build + diff --git a/fuzzers/007-timing/projects/generate.sh b/fuzzers/007-timing/projects/generate.sh new file mode 100644 index 00000000..f8e6e094 --- /dev/null +++ b/fuzzers/007-timing/projects/generate.sh @@ -0,0 +1,9 @@ +#!/bin/bash + +source ${XRAY_GENHEADER} +TIMFUZ_DIR=$XRAY_DIR/fuzzers/007-timing + +timing_txt2csv () { + python3 $TIMFUZ_DIR/timing_txt2csv.py --speed-json $TIMFUZ_DIR/speed/build/speed.json --out timing3.csv timing3.txt +} + diff --git a/fuzzers/007-timing/projects/oneblinkw/Makefile b/fuzzers/007-timing/projects/oneblinkw/Makefile new file mode 100644 index 00000000..9c8b1947 --- /dev/null +++ b/fuzzers/007-timing/projects/oneblinkw/Makefile @@ -0,0 +1,2 @@ +include ../project.mk + diff --git a/fuzzers/007-timing/projects/oneblinkw/generate.sh b/fuzzers/007-timing/projects/oneblinkw/generate.sh new file mode 100755 index 00000000..0ba2a7fc --- /dev/null +++ b/fuzzers/007-timing/projects/oneblinkw/generate.sh @@ -0,0 +1,8 @@ +#!/bin/bash + +set -ex +source ../generate.sh + +vivado -mode batch -source ../generate.tcl +timing_txt2csv + diff --git a/fuzzers/007-timing/projects/oneblinkw/generate.tcl b/fuzzers/007-timing/projects/oneblinkw/generate.tcl new file mode 100644 index 00000000..e7946556 --- /dev/null +++ b/fuzzers/007-timing/projects/oneblinkw/generate.tcl @@ -0,0 +1,47 @@ +source ../../../../../utils/utils.tcl +source ../../project.tcl + +proc build_design {} { + create_project -force -part $::env(XRAY_PART) design design + read_verilog ../top.v + synth_design -top top + + puts "Locking pins" + set_property LOCK_PINS {I0:A1 I1:A2 I2:A3 I3:A4 I4:A5 I5:A6} \ + [get_cells -quiet -filter {REF_NAME == LUT6} -hierarchical] + + puts "Package stuff" + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_00) IOSTANDARD LVCMOS33" [get_ports clk] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_01) IOSTANDARD LVCMOS33" [get_ports stb] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_02) IOSTANDARD LVCMOS33" 
[get_ports di] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_03) IOSTANDARD LVCMOS33" [get_ports do] + + puts "pblocking" + create_pblock roi + set roipb [get_pblocks roi] + set_property EXCLUDE_PLACEMENT 1 $roipb + add_cells_to_pblock $roipb [get_cells roi] + resize_pblock $roipb -add "$::env(XRAY_ROI)" + + puts "randplace" + #randplace_pblock 50 roi + + set_property CFGBVS VCCO [current_design] + set_property CONFIG_VOLTAGE 3.3 [current_design] + set_property BITSTREAM.GENERAL.PERFRAMECRC YES [current_design] + + puts "dedicated route" + set_property CLOCK_DEDICATED_ROUTE FALSE [get_nets clk_IBUF] + + place_design + route_design + + write_checkpoint -force design.dcp + # disable combinatorial loop + # set_property IS_ENABLED 0 [get_drc_checks {LUTLP-1}] + #write_bitstream -force design.bit +} + +build_design +write_info3 + diff --git a/fuzzers/007-timing/projects/oneblinkw/top.v b/fuzzers/007-timing/projects/oneblinkw/top.v new file mode 100644 index 00000000..5e133bac --- /dev/null +++ b/fuzzers/007-timing/projects/oneblinkw/top.v @@ -0,0 +1,37 @@ +module roi ( + input wire clk, + output wire out); + reg [23:0] counter; + assign out = counter[23] ^ counter[22] ^ counter[2] && counter[1] || counter[0]; + + always @(posedge clk) begin + counter <= counter + 1; + end +endmodule + +module top(input wire clk, input wire stb, input wire di, output wire do); + localparam integer DIN_N = 0; + localparam integer DOUT_N = 1; + + reg [DIN_N-1:0] din; + wire [DOUT_N-1:0] dout; + + reg [DIN_N-1:0] din_shr; + reg [DOUT_N-1:0] dout_shr; + + always @(posedge clk) begin + din_shr <= {din_shr, di}; + dout_shr <= {dout_shr, din_shr[DIN_N-1]}; + if (stb) begin + din <= din_shr; + dout_shr <= dout; + end + end + + assign do = dout_shr[DOUT_N-1]; + roi roi( + .clk(clk), + .out(dout[0]) + ); +endmodule + diff --git a/fuzzers/007-timing/timfuz.py b/fuzzers/007-timing/timfuz.py index 604649c9..868e8126 100644 --- a/fuzzers/007-timing/timfuz.py +++ b/fuzzers/007-timing/timfuz.py @@ -153,10 +153,10 @@ def simplify_rows(Ads, b_ub, remove_zd=False): zero_ds += 1 continue - # A very few of these exist with very small values - # TODO: investigate, understand what these are - # Leaving these in can make the result unsolvable since there does not exist a set of constants to reach the delay + # I think I ran into these before when taking out ZERO elements if len(rowd) == 0: + if b != 0: + assert zero_es == 0, 'Unexpected zero element row with non-zero delay' zero_es += 1 continue From 6197a9353620e4458a1417365dcf7a152772241b Mon Sep 17 00:00:00 2001 From: John McMaster Date: Tue, 11 Sep 2018 17:32:50 -0700 Subject: [PATCH 36/55] timfuz: picorv32 project Signed-off-by: John McMaster --- .../007-timing/projects/oneblinkw/README.md | 2 + fuzzers/007-timing/projects/picorv32/Makefile | 2 + .../007-timing/projects/picorv32/README.md | 3 ++ .../007-timing/projects/picorv32/generate.sh | 8 ++++ .../007-timing/projects/picorv32/generate.tcl | 48 +++++++++++++++++++ 5 files changed, 63 insertions(+) create mode 100644 fuzzers/007-timing/projects/oneblinkw/README.md create mode 100644 fuzzers/007-timing/projects/picorv32/Makefile create mode 100644 fuzzers/007-timing/projects/picorv32/README.md create mode 100755 fuzzers/007-timing/projects/picorv32/generate.sh create mode 100644 fuzzers/007-timing/projects/picorv32/generate.tcl diff --git a/fuzzers/007-timing/projects/oneblinkw/README.md b/fuzzers/007-timing/projects/oneblinkw/README.md new file mode 100644 index 00000000..ae7cac37 --- /dev/null +++
b/fuzzers/007-timing/projects/oneblinkw/README.md @@ -0,0 +1,2 @@ +Minimal, simple test + diff --git a/fuzzers/007-timing/projects/picorv32/Makefile b/fuzzers/007-timing/projects/picorv32/Makefile new file mode 100644 index 00000000..9c8b1947 --- /dev/null +++ b/fuzzers/007-timing/projects/picorv32/Makefile @@ -0,0 +1,2 @@ +include ../project.mk + diff --git a/fuzzers/007-timing/projects/picorv32/README.md b/fuzzers/007-timing/projects/picorv32/README.md new file mode 100644 index 00000000..0be27709 --- /dev/null +++ b/fuzzers/007-timing/projects/picorv32/README.md @@ -0,0 +1,3 @@ +picorv32 uses more advanced structures than simple LUT/FF tests (such as carry chains) +It attempts to provide some realistic timing data with respect to fanout and the fabric actually used + diff --git a/fuzzers/007-timing/projects/picorv32/generate.sh b/fuzzers/007-timing/projects/picorv32/generate.sh new file mode 100755 index 00000000..0ba2a7fc --- /dev/null +++ b/fuzzers/007-timing/projects/picorv32/generate.sh @@ -0,0 +1,8 @@ +#!/bin/bash + +set -ex +source ../generate.sh + +vivado -mode batch -source ../generate.tcl +timing_txt2csv + diff --git a/fuzzers/007-timing/projects/picorv32/generate.tcl b/fuzzers/007-timing/projects/picorv32/generate.tcl new file mode 100644 index 00000000..a928a3bd --- /dev/null +++ b/fuzzers/007-timing/projects/picorv32/generate.tcl @@ -0,0 +1,48 @@ +source ../../../../../utils/utils.tcl +source ../../project.tcl + +proc build_design {} { + create_project -force -part $::env(XRAY_PART) design design + read_verilog ../../../src/picorv32.v + read_verilog ../top.v + synth_design -top top + + puts "Locking pins" + set_property LOCK_PINS {I0:A1 I1:A2 I2:A3 I3:A4 I4:A5 I5:A6} \ + [get_cells -quiet -filter {REF_NAME == LUT6} -hierarchical] + + puts "Package stuff" + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_00) IOSTANDARD LVCMOS33" [get_ports clk] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_01) IOSTANDARD LVCMOS33" [get_ports stb] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_02) IOSTANDARD LVCMOS33" [get_ports di] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_03) IOSTANDARD LVCMOS33" [get_ports do] + + puts "pblocking" + create_pblock roi + set roipb [get_pblocks roi] + set_property EXCLUDE_PLACEMENT 1 $roipb + add_cells_to_pblock $roipb [get_cells roi] + resize_pblock $roipb -add "$::env(XRAY_ROI)" + + puts "randplace" + randplace_pblock 50 roi + + set_property CFGBVS VCCO [current_design] + set_property CONFIG_VOLTAGE 3.3 [current_design] + set_property BITSTREAM.GENERAL.PERFRAMECRC YES [current_design] + + puts "dedicated route" + set_property CLOCK_DEDICATED_ROUTE FALSE [get_nets clk_IBUF] + + place_design + route_design + + write_checkpoint -force design.dcp + # disable combinatorial loop + # set_property IS_ENABLED 0 [get_drc_checks {LUTLP-1}] + #write_bitstream -force design.bit +} + +build_design +write_info3 + From 5c122c2fe15a81edad5826e29d50e82cf24f078f Mon Sep 17 00:00:00 2001 From: John McMaster Date: Tue, 11 Sep 2018 18:18:40 -0700 Subject: [PATCH 37/55] timfuz: misc cleanup Signed-off-by: John McMaster --- fuzzers/007-timing/Makefile | 5 + fuzzers/007-timing/checksub.py | 7 +- fuzzers/007-timing/corner_csv.py | 2 +- fuzzers/007-timing/projects/Makefile | 4 + .../007-timing/projects/placelut/README.md | 2 + .../007-timing/projects/placelut_fb/Makefile | 2 + .../007-timing/projects/placelut_fb/README.md | 2 + .../{placelut_fb.py => generate.py} | 0 .../projects/placelut_fb/generate.sh | 9 + .../projects/placelut_fb/generate.tcl | 47 +++++ .../projects/placelut_ff_fb/Makefile |
2 + .../projects/placelut_ff_fb/README.md | 3 + .../{placelut_ff_fb.py => generate.py} | 0 .../projects/placelut_ff_fb/generate.sh | 9 + .../projects/placelut_ff_fb/generate.tcl | 47 +++++ fuzzers/007-timing/rref.py | 2 +- fuzzers/007-timing/solve_linprog.py | 5 - fuzzers/007-timing/timfuz.py | 165 ++---------------- fuzzers/007-timing/timfuz_massage.py | 18 +- fuzzers/007-timing/timfuz_solve.py | 4 +- 20 files changed, 156 insertions(+), 179 deletions(-) create mode 100644 fuzzers/007-timing/Makefile create mode 100644 fuzzers/007-timing/projects/Makefile create mode 100644 fuzzers/007-timing/projects/placelut/README.md create mode 100644 fuzzers/007-timing/projects/placelut_fb/Makefile create mode 100644 fuzzers/007-timing/projects/placelut_fb/README.md rename fuzzers/007-timing/projects/placelut_fb/{placelut_fb.py => generate.py} (100%) create mode 100755 fuzzers/007-timing/projects/placelut_fb/generate.sh create mode 100644 fuzzers/007-timing/projects/placelut_fb/generate.tcl create mode 100644 fuzzers/007-timing/projects/placelut_ff_fb/Makefile create mode 100644 fuzzers/007-timing/projects/placelut_ff_fb/README.md rename fuzzers/007-timing/projects/placelut_ff_fb/{placelut_ff_fb.py => generate.py} (100%) create mode 100755 fuzzers/007-timing/projects/placelut_ff_fb/generate.sh create mode 100644 fuzzers/007-timing/projects/placelut_ff_fb/generate.tcl diff --git a/fuzzers/007-timing/Makefile b/fuzzers/007-timing/Makefile new file mode 100644 index 00000000..1f90909f --- /dev/null +++ b/fuzzers/007-timing/Makefile @@ -0,0 +1,5 @@ +all: + cd speed && make + cd timgrid && make + cd projects && make + diff --git a/fuzzers/007-timing/checksub.py b/fuzzers/007-timing/checksub.py index 9cdb259d..00559735 100644 --- a/fuzzers/007-timing/checksub.py +++ b/fuzzers/007-timing/checksub.py @@ -1,6 +1,6 @@ #!/usr/bin/env python3 -from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json +from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json import numpy as np import glob import json @@ -58,11 +58,6 @@ def run(fns_in, sub_json=None, verbose=False): Ads, b = loadc_Ads_b(fns_in, corner, ico=True) - # Remove duplicate rows - # is this necessary? 
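A note on what checksub.py is checking: the sub.json produced by rref.py records groups of variables that only ever appear together in the observed paths, run_sub_json rewrites every equation so each group is represented by a single pivot variable (which is what makes the system fully ranked), and checksub.py verifies that no non-pivot member survives the rewrite. A minimal sketch of the row operation this implies, with illustrative names and data shapes rather than the exact prjxray structures:

    # Hypothetical sketch: collapse one substitution group onto its pivot.
    # row maps variable name -> count; subs maps each non-pivot member of
    # the pivot's group to its coefficient relative to the pivot.
    def sub_group(row, pivot, subs):
        n = row.get(pivot, 0)  # occurrences of the group in this row
        for name, coeff in sorted(subs.items()):
            left = row.get(name, 0) - n * coeff
            if left == 0:
                row.pop(name, None)  # cleanly absorbed into the pivot
            else:
                row[name] = left  # leftover non-pivot term
        return row

    row = {'PIP_A': 1, 'WIRE_B': 1, 'WIRE_C': 2}
    # pivot PIP_A's group carries one WIRE_B per occurrence
    print(sub_group(row, 'PIP_A', {'WIRE_B': 1}))  # {'PIP_A': 1, 'WIRE_C': 2}

If any row keeps a non-pivot term after all substitutions the solve is not cleanly ranked, which is exactly the condition the 'non-pivot element after group sub' assertion above guards against.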
- # maybe better to just add them into the matrix directly - #Ads, b = simplify_rows(Ads, b) - if sub_json: print('Subbing JSON %u rows' % len(Ads)) #pds(Ads, 'Orig') diff --git a/fuzzers/007-timing/corner_csv.py b/fuzzers/007-timing/corner_csv.py index 1df10bd0..d64c64ab 100644 --- a/fuzzers/007-timing/corner_csv.py +++ b/fuzzers/007-timing/corner_csv.py @@ -5,7 +5,7 @@ import glob def run(fout, fns_in, corner, verbose=0): Ads, b = loadc_Ads_b(fns_in, corner, ico=True) - Ads, b = simplify_rows(Ads, b) + Ads, b = simplify_rows(Ads, b, corner=corner) fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') for row_b, row_ds in zip(b, Ads): diff --git a/fuzzers/007-timing/projects/Makefile b/fuzzers/007-timing/projects/Makefile new file mode 100644 index 00000000..eb1f30a9 --- /dev/null +++ b/fuzzers/007-timing/projects/Makefile @@ -0,0 +1,4 @@ +all: + echo "FIXME: tie projects together" + false + diff --git a/fuzzers/007-timing/projects/placelut/README.md b/fuzzers/007-timing/projects/placelut/README.md new file mode 100644 index 00000000..0df7e3f8 --- /dev/null +++ b/fuzzers/007-timing/projects/placelut/README.md @@ -0,0 +1,2 @@ +LUTs are physically laid out in an array and directly connected to a test pattern generator + diff --git a/fuzzers/007-timing/projects/placelut_fb/Makefile b/fuzzers/007-timing/projects/placelut_fb/Makefile new file mode 100644 index 00000000..9c8b1947 --- /dev/null +++ b/fuzzers/007-timing/projects/placelut_fb/Makefile @@ -0,0 +1,2 @@ +include ../project.mk + diff --git a/fuzzers/007-timing/projects/placelut_fb/README.md b/fuzzers/007-timing/projects/placelut_fb/README.md new file mode 100644 index 00000000..1e597818 --- /dev/null +++ b/fuzzers/007-timing/projects/placelut_fb/README.md @@ -0,0 +1,2 @@ +LUTs are physically laid out in an array and connected to a test pattern generator and fed back to other LUTs + diff --git a/fuzzers/007-timing/projects/placelut_fb/placelut_fb.py b/fuzzers/007-timing/projects/placelut_fb/generate.py similarity index 100% rename from fuzzers/007-timing/projects/placelut_fb/placelut_fb.py rename to fuzzers/007-timing/projects/placelut_fb/generate.py diff --git a/fuzzers/007-timing/projects/placelut_fb/generate.sh b/fuzzers/007-timing/projects/placelut_fb/generate.sh new file mode 100755 index 00000000..579f2021 --- /dev/null +++ b/fuzzers/007-timing/projects/placelut_fb/generate.sh @@ -0,0 +1,9 @@ +#!/bin/bash + +set -ex +source ../generate.sh + +python ../generate.py --sdx 4 --sdy 4 >top.v +vivado -mode batch -source ../generate.tcl +timing_txt2csv + diff --git a/fuzzers/007-timing/projects/placelut_fb/generate.tcl b/fuzzers/007-timing/projects/placelut_fb/generate.tcl new file mode 100644 index 00000000..0b536169 --- /dev/null +++ b/fuzzers/007-timing/projects/placelut_fb/generate.tcl @@ -0,0 +1,47 @@ +source ../../../../../utils/utils.tcl +source ../../project.tcl + +proc build_design {} { + create_project -force -part $::env(XRAY_PART) design design + read_verilog top.v + synth_design -top top + + puts "Locking pins" + set_property LOCK_PINS {I0:A1 I1:A2 I2:A3 I3:A4 I4:A5 I5:A6} \ + [get_cells -quiet -filter {REF_NAME == LUT6} -hierarchical] + + puts "Package stuff" + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_00) IOSTANDARD LVCMOS33" [get_ports clk] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_01) IOSTANDARD LVCMOS33" [get_ports stb] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_02) IOSTANDARD LVCMOS33" [get_ports di] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_03) IOSTANDARD LVCMOS33" [get_ports do] +
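Passing the corner down into simplify_rows, as the corner_csv.py hunk above starts doing, matters because the deduplication direction is corner dependent: when several specimens report the same set of pips and wires, a max corner should keep the largest observed delay and a min corner the smallest (this is the minmax table that lands in timfuz.py later in this patch). A small self-contained illustration of that merge rule, with made-up path names and delays:

    # Sketch: merge duplicate observations of one path, per corner.
    # Seeded with the first observation rather than 0 so min corners
    # are not pinned to zero.
    minmax = {'fast_max': max, 'fast_min': min, 'slow_max': max, 'slow_min': min}
    obs = [(('PIP_A', 'WIRE_B'), 120), (('PIP_A', 'WIRE_B'), 135)]
    for corner in ('slow_max', 'slow_min'):
        eqns = {}
        merge = minmax[corner]
        for path, delay in obs:
            eqns[path] = merge(eqns.get(path, delay), delay)
        print(corner, eqns[('PIP_A', 'WIRE_B')])  # slow_max 135, slow_min 120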
+ puts "pblocking" + create_pblock roi + set roipb [get_pblocks roi] + set_property EXCLUDE_PLACEMENT 1 $roipb + add_cells_to_pblock $roipb [get_cells roi] + resize_pblock $roipb -add "$::env(XRAY_ROI)" + + puts "randplace" + randplace_pblock 50 roi + + set_property CFGBVS VCCO [current_design] + set_property CONFIG_VOLTAGE 3.3 [current_design] + set_property BITSTREAM.GENERAL.PERFRAMECRC YES [current_design] + + puts "dedicated route" + set_property CLOCK_DEDICATED_ROUTE FALSE [get_nets clk_IBUF] + + place_design + route_design + + write_checkpoint -force design.dcp + # disable combinitorial loop + # set_property IS_ENABLED 0 [get_drc_checks {LUTLP-1}] + #write_bitstream -force design.bit +} + +build_design +write_info3 + diff --git a/fuzzers/007-timing/projects/placelut_ff_fb/Makefile b/fuzzers/007-timing/projects/placelut_ff_fb/Makefile new file mode 100644 index 00000000..9c8b1947 --- /dev/null +++ b/fuzzers/007-timing/projects/placelut_ff_fb/Makefile @@ -0,0 +1,2 @@ +include ../project.mk + diff --git a/fuzzers/007-timing/projects/placelut_ff_fb/README.md b/fuzzers/007-timing/projects/placelut_ff_fb/README.md new file mode 100644 index 00000000..983849b3 --- /dev/null +++ b/fuzzers/007-timing/projects/placelut_ff_fb/README.md @@ -0,0 +1,3 @@ +LUTs are physically laid out in an array and connected to test pattern generator and fed back to other LUTs. +FFs are randomly inserted between connections. + diff --git a/fuzzers/007-timing/projects/placelut_ff_fb/placelut_ff_fb.py b/fuzzers/007-timing/projects/placelut_ff_fb/generate.py similarity index 100% rename from fuzzers/007-timing/projects/placelut_ff_fb/placelut_ff_fb.py rename to fuzzers/007-timing/projects/placelut_ff_fb/generate.py diff --git a/fuzzers/007-timing/projects/placelut_ff_fb/generate.sh b/fuzzers/007-timing/projects/placelut_ff_fb/generate.sh new file mode 100755 index 00000000..579f2021 --- /dev/null +++ b/fuzzers/007-timing/projects/placelut_ff_fb/generate.sh @@ -0,0 +1,9 @@ +#!/bin/bash + +set -ex +source ../generate.sh + +python ../generate.py --sdx 4 --sdy 4 >top.v +vivado -mode batch -source ../generate.tcl +timing_txt2csv + diff --git a/fuzzers/007-timing/projects/placelut_ff_fb/generate.tcl b/fuzzers/007-timing/projects/placelut_ff_fb/generate.tcl new file mode 100644 index 00000000..0b536169 --- /dev/null +++ b/fuzzers/007-timing/projects/placelut_ff_fb/generate.tcl @@ -0,0 +1,47 @@ +source ../../../../../utils/utils.tcl +source ../../project.tcl + +proc build_design {} { + create_project -force -part $::env(XRAY_PART) design design + read_verilog top.v + synth_design -top top + + puts "Locking pins" + set_property LOCK_PINS {I0:A1 I1:A2 I2:A3 I3:A4 I4:A5 I5:A6} \ + [get_cells -quiet -filter {REF_NAME == LUT6} -hierarchical] + + puts "Package stuff" + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_00) IOSTANDARD LVCMOS33" [get_ports clk] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_01) IOSTANDARD LVCMOS33" [get_ports stb] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_02) IOSTANDARD LVCMOS33" [get_ports di] + set_property -dict "PACKAGE_PIN $::env(XRAY_PIN_03) IOSTANDARD LVCMOS33" [get_ports do] + + puts "pblocking" + create_pblock roi + set roipb [get_pblocks roi] + set_property EXCLUDE_PLACEMENT 1 $roipb + add_cells_to_pblock $roipb [get_cells roi] + resize_pblock $roipb -add "$::env(XRAY_ROI)" + + puts "randplace" + randplace_pblock 50 roi + + set_property CFGBVS VCCO [current_design] + set_property CONFIG_VOLTAGE 3.3 [current_design] + set_property BITSTREAM.GENERAL.PERFRAMECRC YES [current_design] 
+ + puts "dedicated route" + set_property CLOCK_DEDICATED_ROUTE FALSE [get_nets clk_IBUF] + + place_design + route_design + + write_checkpoint -force design.dcp + # disable combinitorial loop + # set_property IS_ENABLED 0 [get_drc_checks {LUTLP-1}] + #write_bitstream -force design.bit +} + +build_design +write_info3 + diff --git a/fuzzers/007-timing/rref.py b/fuzzers/007-timing/rref.py index 19dcc89c..4cf1b9e7 100644 --- a/fuzzers/007-timing/rref.py +++ b/fuzzers/007-timing/rref.py @@ -71,7 +71,7 @@ class State(object): Ads, b = loadc_Ads_b(fn_ins, corner=corner, ico=True) if simplify: print('Simplifying corner %s' % (corner,)) - Ads, b = simplify_rows(Ads, b, remove_zd=False) + Ads, b = simplify_rows(Ads, b, remove_zd=False, corner=corner) return State(Ads) def write_state(state, fout): diff --git a/fuzzers/007-timing/solve_linprog.py b/fuzzers/007-timing/solve_linprog.py index 201ba7ca..ec25474c 100644 --- a/fuzzers/007-timing/solve_linprog.py +++ b/fuzzers/007-timing/solve_linprog.py @@ -105,11 +105,6 @@ def run_corner(Anp, b, names, verbose=False, opts={}, meta={}, outfn=None): if nonzero and (verbose or ((nonzeros < 100 or nonzeros % 20 == 0) and nonzeros <= plim)): print(' % 4u % -80s % 10.1f' % (xi, name, x)) print('Delay on %d / %d' % (nonzeros, len(res.x))) - if not os.path.exists('res'): - os.mkdir('res') - fn_out = 'res/%s' % datetime.datetime.utcnow().isoformat().split('.')[0] - print('Writing %s' % fn_out) - np.save(fn_out, (3, c, A_ub, b_ub, bounds, names, res, meta)) if outfn: # ballpark minimum actual observed delay is around 7 (carry chain) diff --git a/fuzzers/007-timing/timfuz.py b/fuzzers/007-timing/timfuz.py index 868e8126..09b34da2 100644 --- a/fuzzers/007-timing/timfuz.py +++ b/fuzzers/007-timing/timfuz.py @@ -130,12 +130,20 @@ def Ab_ub_dt2d(eqns): return list(A_ubd), list(b_ub) # This significantly reduces runtime -def simplify_rows(Ads, b_ub, remove_zd=False): +def simplify_rows(Ads, b_ub, remove_zd=False, corner=None): '''Remove duplicate equations, taking highest delay''' # dict of constants to highest delay eqns = OrderedDict() assert len(Ads) == len(b_ub), (len(Ads), len(b_ub)) + assert corner is not None + minmax = { + 'fast_max': max, + 'fast_min': min, + 'slow_max': max, + 'slow_min': min, + }[corner] + sys.stdout.write('SimpR ') sys.stdout.flush() progress = int(max(1, len(b_ub) / 100)) @@ -161,7 +169,7 @@ def simplify_rows(Ads, b_ub, remove_zd=False): continue rowt = Ar_ds2t(rowd) - eqns[rowt] = max(eqns.get(rowt, 0), b) + eqns[rowt] = minmax(eqns.get(rowt, 0), b) print(' done') @@ -473,159 +481,6 @@ def filter_ncols(A_ubd, b_ub, cols_min=0, cols_max=0): assert len(b_ub_ret) return A_ubd_ret, b_ub_ret -def preprocess(A_ubd, b_ub, opts, names, verbose=0): - def debug(what): - if verbose: - print('') - print_eqns(A_ubd, b_ub, verbose=verbose, label=what, lim=20) - col_dist(A_ubd, what, names) - check_feasible_d(A_ubd, b_ub, names) - - col_dist(A_ubd, 'pre-filt', names, lim=12) - debug('pre-filt') - - need_simpc = 0 - - # Input set may have redundant constraints - A_ubd, b_ub = simplify_rows(A_ubd=A_ubd, b_ub=b_ub) - debug("simp_rows") - cols_min_pre = opts.get('cols_min_pre', None) - cols_max_pre = opts.get('cols_max_pre', None) - # Filter input based on number of columns - if cols_min_pre or cols_max_pre: - A_ubd, b_ub = filter_ncols(A_ubd=A_ubd, b_ub=b_ub, cols_min=cols_min_pre, cols_max=cols_max_pre) - debug("filt_ncols") - need_simpc = 1 - - # Limit input rows, mostly for quick full run checks - row_limit = opts.get('row_limit', None) - if row_limit: - 
before_rows = len(b_ub) - A_ubd = A_ubd[0:row_limit] - b_ub = b_ub[0:row_limit] - print('Row limit %d => %d rows' % (before_rows, len(b_ub))) - need_simpc = 1 - - if need_simpc: - names, A_ubd, b_ub = simplify_cols(names=names, A_ubd=A_ubd, b_ub=b_ub) - debug("simp_cols") - - return A_ubd, b_ub, names - -def massage_equations(A_ubd, b_ub, opts, names, verbose=0): - ''' - Equation pipeline - Some operations may generate new equations - Simplify after these to avoid unnecessary overhead on redundant constraints - Similarly some operations may eliminate equations, potentially eliminating a column (ie variable) - Remove these columns as necessary to speed up solving - ''' - - def debug(what): - if verbose: - print('') - print_eqns(A_ubd, b_ub, verbose=verbose, label=what, lim=20) - col_dist(A_ubd, what, names) - check_feasible_d(A_ubd, b_ub, names) - - A_ubd, b_ub, names = preprocess(A_ubd, b_ub, opts, names, verbose=verbose) - - # Try to (intelligently) subtract equations to generate additional constraints - # This helps avoid putting all delay in a single shared variable - derive_lim = opts.get('derive_lim', None) - if derive_lim: - dstart = len(b_ub) - - # Original simple - if 0: - for di in range(derive_lim): - print - assert len(A_ubd) == len(b_ub) - n_orig = len(b_ub) - - # Meat of the operation - # Focus on easy equations for first pass to get a lot of easy derrivations - col_lim = 12 if di == 0 else None - #col_lim = None - A_ubd, b_ub = derive_eq_by_row(A_ubd, b_ub, col_lim=col_lim) - debug("der_rows") - # Run another simplify pass since new equations may have overlap with original - A_ubd, b_ub = simplify_rows(A_ubd, b_ub) - print('Derive row %d / %d: %d => %d equations' % (di + 1, derive_lim, n_orig, len(b_ub))) - debug("der_rows simp") - - n_orig2 = len(b_ub) - # Meat of the operation - A_ubd, b_ub = derive_eq_by_col(A_ubd, b_ub) - debug("der_cols") - # Run another simplify pass since new equations may have overlap with original - A_ubd, b_ub = simplify_rows(A_ubd=A_ubd, b_ub=b_ub) - print('Derive col %d / %d: %d => %d equations' % (di + 1, derive_lim, n_orig2, len(b_ub))) - debug("der_cols simp") - - if n_orig == len(b_ub): - break - - if 1: - # Each iteration one more column is allowed until all columns are included - # (and the system is stable) - col_lim = 15 - di = 0 - while True: - print - n_orig = len(b_ub) - - print('Loop %d, lim %d' % (di + 1, col_lim)) - # Meat of the operation - A_ubd, b_ub = derive_eq_by_row(A_ubd, b_ub, col_lim=col_lim, tweak=True) - debug("der_rows") - # Run another simplify pass since new equations may have overlap with original - A_ubd, b_ub = simplify_rows(A_ubd, b_ub) - print('Derive row: %d => %d equations' % (n_orig, len(b_ub))) - debug("der_rows simp") - - n_orig2 = len(b_ub) - # Meat of the operation - A_ubd, b_ub = derive_eq_by_col(A_ubd, b_ub) - debug("der_cols") - # Run another simplify pass since new equations may have overlap with original - A_ubd, b_ub = simplify_rows(A_ubd=A_ubd, b_ub=b_ub) - print('Derive col %d: %d => %d equations' % (di + 1, n_orig2, len(b_ub))) - debug("der_cols simp") - - # Doesn't help computation, but helps debugging - names, A_ubd, b_ub = simplify_cols(names=names, A_ubd=A_ubd, b_ub=b_ub) - A_ubd, b_ub = sort_equations(A_ubd, b_ub) - debug("loop done") - col_dist(A_ubd, 'derive done iter %d, lim %d' % (di, col_lim), names, lim=12) - - rows = len(A_ubd) - if n_orig == len(b_ub) and col_lim >= rows: - break - col_lim += col_lim / 5 - di += 1 - - dend = len(b_ub) - print('') - print('Derive net: %d => %d' % 
(dstart, dend)) - print('') - # Was experimentting to see how much the higher order columns really help - - cols_min_post = opts.get('cols_min_post', None) - cols_max_post = opts.get('cols_max_post', None) - # Filter input based on number of columns - if cols_min_post or cols_max_post: - A_ubd, b_ub = filter_ncols(A_ubd=A_ubd, b_ub=b_ub, cols_min=cols_min_post, cols_max=cols_max_post) - debug("filter_ncals final") - - names, A_ubd, b_ub = simplify_cols(names=names, A_ubd=A_ubd, b_ub=b_ub) - debug("simp_cols final") - - # Helps debug readability - A_ubd, b_ub = sort_equations(A_ubd, b_ub) - debug("final (sorted)") - return names, A_ubd, b_ub - def Ar_di2ds(rowA, names): row = OrderedDict() for k, v in rowA.items(): diff --git a/fuzzers/007-timing/timfuz_massage.py b/fuzzers/007-timing/timfuz_massage.py index 046886ce..e35f4e28 100644 --- a/fuzzers/007-timing/timfuz_massage.py +++ b/fuzzers/007-timing/timfuz_massage.py @@ -323,7 +323,7 @@ def derive_eq_by_col(Ads, b_ub, verbose=0): return Ads_ret, b_ret # keep derriving until solution is (probably) stable -def massage_equations_old(Ads, b, verbose=False, derive_lim=3): +def massage_equations_old(Ads, b, verbose=False, derive_lim=3, corner=None): ''' Equation pipeline Some operations may generate new equations @@ -356,7 +356,7 @@ def massage_equations_old(Ads, b, verbose=False, derive_lim=3): Ads, b = derive_eq_by_row(Ads, b, col_lim=col_lim) debug("der_rows") # Run another simplify pass since new equations may have overlap with original - Ads, b = simplify_rows(Ads, b) + Ads, b = simplify_rows(Ads, b, corner=corner) print('Derive row %d / %d: %d => %d equations' % (di + 1, derive_lim, n_orig, len(b))) debug("der_rows simp") @@ -365,7 +365,7 @@ def massage_equations_old(Ads, b, verbose=False, derive_lim=3): Ads, b = derive_eq_by_col(Ads, b) debug("der_cols") # Run another simplify pass since new equations may have overlap with original - Ads, b = simplify_rows(Ads, b) + Ads, b = simplify_rows(Ads, b, corner=corner) print('Derive col %d / %d: %d => %d equations' % (di + 1, derive_lim, n_orig2, len(b))) debug("der_cols simp") @@ -394,7 +394,7 @@ def massage_equations_old(Ads, b, verbose=False, derive_lim=3): return Ads, b # iteratively increasing column limit until all columns are added -def massage_equations_inc_col_lim(Ads, b, verbose=False): +def massage_equations_inc_col_lim(Ads, b, verbose=False, corner=None): ''' Equation pipeline Some operations may generate new equations @@ -428,7 +428,7 @@ def massage_equations_inc_col_lim(Ads, b, verbose=False): Ads, b = derive_eq_by_row(Ads, b, col_lim=col_lim, tweak=True) debug("der_rows") # Run another simplify pass since new equations may have overlap with original - Ads, b = simplify_rows(Ads, b) + Ads, b = simplify_rows(Ads, b, corner=corner) print('Derive row: %d => %d equations' % (n_orig, len(b))) debug("der_rows simp") @@ -437,7 +437,7 @@ def massage_equations_inc_col_lim(Ads, b, verbose=False): Ads, b = derive_eq_by_col(Ads, b) debug("der_cols") # Run another simplify pass since new equations may have overlap with original - Ads, b = simplify_rows(Ads, b) + Ads, b = simplify_rows(Ads, b, corner=corner) print('Derive col %d: %d => %d equations' % (di + 1, n_orig2, len(b))) debug("der_cols simp") @@ -467,7 +467,7 @@ def massage_equations_inc_col_lim(Ads, b, verbose=False): # only derive based on nearby equations # theory is they will be the best to diff -def massage_equations_near(Ads, b, verbose=False): +def massage_equations_near(Ads, b, verbose=False, corner=None): ''' Equation pipeline 
Some operations may generate new equations @@ -497,7 +497,7 @@ def massage_equations_near(Ads, b, verbose=False): Ads, b = derive_eq_by_near_row(Ads, b, tweak=True) debug("der_rows") # Run another simplify pass since new equations may have overlap with original - Ads, b = simplify_rows(Ads, b) + Ads, b = simplify_rows(Ads, b, corner=corner) print('Derive row: %d => %d equations' % (n_orig, len(b))) debug("der_rows simp") @@ -506,7 +506,7 @@ def massage_equations_near(Ads, b, verbose=False): Ads, b = derive_eq_by_col(Ads, b) debug("der_cols") # Run another simplify pass since new equations may have overlap with original - Ads, b = simplify_rows(Ads, b) + Ads, b = simplify_rows(Ads, b, corner=corner) print('Derive col: %d => %d equations' % (n_orig2, len(b))) debug("der_cols simp") diff --git a/fuzzers/007-timing/timfuz_solve.py b/fuzzers/007-timing/timfuz_solve.py index c6343e70..0d5b36d9 100644 --- a/fuzzers/007-timing/timfuz_solve.py +++ b/fuzzers/007-timing/timfuz_solve.py @@ -91,7 +91,7 @@ def run(fns_in, corner, run_corner, sub_json=None, sub_csv=None, dedup=True, mas if dedup: oldn = len(Ads) iold = instances(Ads) - Ads, b = simplify_rows(Ads, b) + Ads, b = simplify_rows(Ads, b, corner=corner) print('Simplify %u => %u rows' % (oldn, len(Ads))) print('Simplify %u => %u instances' % (iold, instances(Ads))) @@ -142,7 +142,7 @@ def run(fns_in, corner, run_corner, sub_json=None, sub_csv=None, dedup=True, mas This creates derived constraints to provide more realistic results ''' if massage: - Ads, b = massage_equations(Ads, b) + Ads, b = massage_equations(Ads, b, corner=corner) print('Converting to numpy...') names, Anp = A_ds2np(Ads) From 7e4378446927b8a4a6ded34e29baa3c3de013d30 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Tue, 11 Sep 2018 18:22:22 -0700 Subject: [PATCH 38/55] timfuz: remove dead code Signed-off-by: John McMaster --- fuzzers/007-timing/timfuz_solve.py | 17 ++++++----------- 1 file changed, 6 insertions(+), 11 deletions(-) diff --git a/fuzzers/007-timing/timfuz_solve.py b/fuzzers/007-timing/timfuz_solve.py index 0d5b36d9..5b66ad35 100644 --- a/fuzzers/007-timing/timfuz_solve.py +++ b/fuzzers/007-timing/timfuz_solve.py @@ -111,17 +111,12 @@ def run(fns_in, corner, run_corner, sub_json=None, sub_csv=None, dedup=True, mas # however, I wanted to do some filtering based on expected form if sub_csv: Ads2, b2 = loadc_Ads_b([sub_csv], corner, ico=True) - if 0: - Ads = Ads + Ads2 - b = b + b2 - else: - bounds = Ads2bounds(Ads2, b2) - rows_old = len(Ads) - Ads, b = filter_bounds(Ads, b, bounds) - print('Filter bounds: %s => %s rows' % (rows_old, len(Ads))) - if 1: - Ads = Ads + Ads2 - b = b + b2 + bounds = Ads2bounds(Ads2, b2) + rows_old = len(Ads) + Ads, b = filter_bounds(Ads, b, bounds) + print('Filter bounds: %s => %s rows' % (rows_old, len(Ads))) + Ads = Ads + Ads2 + b = b + b2 if verbose: print From a4950a86025cb3e3b0a805f9b116f1f763d874bc Mon Sep 17 00:00:00 2001 From: John McMaster Date: Tue, 11 Sep 2018 18:36:19 -0700 Subject: [PATCH 39/55] timfuz: misc cleanup Signed-off-by: John McMaster --- fuzzers/007-timing/solve_leastsq.py | 87 ++++++++++++++--------------- fuzzers/007-timing/solve_linprog.py | 2 +- fuzzers/007-timing/timfuz_solve.py | 8 ++- 3 files changed, 48 insertions(+), 49 deletions(-) diff --git a/fuzzers/007-timing/solve_leastsq.py b/fuzzers/007-timing/solve_leastsq.py index fde102c2..bbb20ecc 100644 --- a/fuzzers/007-timing/solve_leastsq.py +++ b/fuzzers/007-timing/solve_leastsq.py @@ -20,16 +20,52 @@ import scipy.optimize as optimize from scipy.optimize 
import least_squares def mkestimate(Anp, b): + ''' + Ballpark upper bound estimate assuming variables contribute all of the delay in their respective row + Return the min of all of the occurrences + + XXX: should this be corner adjusted? + ''' cols = len(Anp[0]) x0 = np.array([1e3 for _x in range(cols)]) for row_np, row_b in zip(Anp, b): for coli, val in enumerate(row_np): if val: + # Scale by number of occurrences ub = row_b / val if ub >= 0: x0[coli] = min(x0[coli], ub) return x0 +def save(outfn, res, names): + # ballpark minimum actual observed delay is around 7 (carry chain) + # anything less than one is probably a solver artifact + delta = 0.5 + + print('Writing results') + skips = 0 + with open(outfn, 'w') as fout: + # write as one variable per line + # this natively forms a bound if fed into linprog solver + fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') + for xval, name in zip(res.x, names): + row_ico = 1 + + # FIXME: only report for the given corner? + # also review ceil vs floor choice for min vs max + # let's be more conservative for now + if xval < delta: + #print('Skipping %s: %0.6f' % (name, xval)) + skips += 1 + continue + #xvali = round(xval) + xvali = math.ceil(xval) + corners = [xvali for _ in range(4)] + items = [str(row_ico), ' '.join([str(x) for x in corners])] + items.append('%u %s' % (1, name)) + fout.write(','.join(items) + '\n') + print('Wrote: skip %u => %u / %u valid delays' % (skips, len(names) - skips, len(names))) + def run_corner(Anp, b, names, verbose=False, opts={}, meta={}, outfn=None): # Given timing scores for above delays (-ps) assert type(Anp[0]) is np.ndarray, type(Anp[0]) @@ -93,59 +129,20 @@ def run_corner(Anp, b, names, verbose=False, opts={}, meta={}, outfn=None): #x0 = np.array([1000.0 for _x in range(cols)]) print('Creating x0 estimate') x0 = mkestimate(Anp, b) - #print('x0', x0) - if 0: - x, cov_x, infodict, mesg, ier = optimize.leastsq(func, x0, args=(), full_output=True) - print('x', x) - print('cov_x', cov_x) - print('infodictx', infodict) - print('mesg', mesg) - print('ier', ier) - print(' Solution found: %s' % (ier in (1, 2, 3, 4))) - else: - print('Solving') - res = least_squares(func, x0, bounds=(0, float('inf'))) - if 0: - print(res) - print('') - print(res.x) - print('Done') - if outfn: - # ballpark minimum actual observed delay is around 7 (carry chain) - # anything less than one is probably a solver artifact - delta = 0.5 + print('Solving') + res = least_squares(func, x0, bounds=(0, float('inf'))) + print('Done') - print('Writing resutls') - skips = 0 - with open(outfn, 'w') as fout: - # write as one variable per line - # this natively forms a bound if fed into linprog solver - fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') - for xval, name in zip(res.x, names): - row_ico = 1 - - # FIXME: only report for the given corner?
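The mkestimate docstring above is the whole trick: in a row with total delay row_b, a variable entering with coefficient val can at most account for row_b / val on its own, so the minimum of that ratio over all rows is a cheap per-variable upper bound to seed least_squares with. A worked toy example, assuming mkestimate is imported from this file:

    import numpy as np
    from solve_leastsq import mkestimate

    # two observed paths over three variables:
    #   2*t0 + 1*t1        = 100
    #   1*t0        + 1*t2 = 30
    Anp = [np.array([2.0, 1.0, 0.0]), np.array([1.0, 0.0, 1.0])]
    b = [100.0, 30.0]
    # t0: min(100/2, 30/1) = 30; t1: 100; t2: 30
    # variables that appear in no row keep the 1e3 default seed
    print(mkestimate(Anp, b))  # [ 30. 100.  30.]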
- # also review ceil vs floor choice for min vs max - # lets be more conservative for now - if xval < delta: - #print('Skipping %s: %0.6f' % (name, xval)) - skips += 1 - continue - #xvali = round(xval) - xvali = math.ceil(xval) - corners = [xvali for _ in range(4)] - items = [str(row_ico), ' '.join([str(x) for x in corners])] - items.append('%u %s' % (1, name)) - fout.write(','.join(items) + '\n') - print('Wrote: skip %u => %u / %u valid delays' % (skips, len(names) - skips, len(names))) + if outfn: + save(outfn, res, names) def main(): import argparse parser = argparse.ArgumentParser( description= - 'Solve timing solution' + 'Solve timing solution using least squares objective function' ) parser.add_argument('--verbose', action='store_true', help='') diff --git a/fuzzers/007-timing/solve_linprog.py b/fuzzers/007-timing/solve_linprog.py index ec25474c..c33cd34a 100644 --- a/fuzzers/007-timing/solve_linprog.py +++ b/fuzzers/007-timing/solve_linprog.py @@ -140,7 +140,7 @@ def main(): parser = argparse.ArgumentParser( description= - 'Solve timing solution' + 'Solve timing solution using linear programming inequalities' ) parser.add_argument('--verbose', action='store_true', help='') diff --git a/fuzzers/007-timing/timfuz_solve.py b/fuzzers/007-timing/timfuz_solve.py index 5b66ad35..c9af58b1 100644 --- a/fuzzers/007-timing/timfuz_solve.py +++ b/fuzzers/007-timing/timfuz_solve.py @@ -106,9 +106,11 @@ def run(fns_in, corner, run_corner, sub_json=None, sub_csv=None, dedup=True, mas else: names = index_names(Ads) - # post substitution csv - # actually this might not be strictly necessary since subs would just not apply - # however, I wanted to do some filtering based on expected form + ''' + Substitution .csv + Special .csv containing one variable per line + Used primarily for multiple optimization passes, such as different algorithms or additional constraints + ''' if sub_csv: Ads2, b2 = loadc_Ads_b([sub_csv], corner, ico=True) bounds = Ads2bounds(Ads2, b2) From a55b766c44bf757bf6cfc80a84a61832db9548a0 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Tue, 11 Sep 2018 19:45:33 -0700 Subject: [PATCH 40/55] timfuz: track corners properly Signed-off-by: John McMaster --- fuzzers/007-timing/csv_flat2group.py | 12 ++--- fuzzers/007-timing/csv_group2flat.py | 34 ++++++------ fuzzers/007-timing/projects/project.mk | 9 ++-- fuzzers/007-timing/solve_leastsq.py | 20 +++----- fuzzers/007-timing/solve_linprog.py | 71 +++++++++++--------------- fuzzers/007-timing/tile_annotate.py | 22 ++++---- fuzzers/007-timing/timfuz.py | 33 ++++++++++-- fuzzers/007-timing/timfuz_solve.py | 2 +- 8 files changed, 111 insertions(+), 92 deletions(-) diff --git a/fuzzers/007-timing/csv_flat2group.py b/fuzzers/007-timing/csv_flat2group.py index 57be54a5..f1398b87 100644 --- a/fuzzers/007-timing/csv_flat2group.py +++ b/fuzzers/007-timing/csv_flat2group.py @@ -1,11 +1,10 @@ #!/usr/bin/env python3 -from timfuz import Benchmark, loadc_Ads_b, index_names, load_sub, run_sub_json, instances +from timfuz import Benchmark, loadc_Ads_bs, index_names, load_sub, run_sub_json, instances def gen_group(fnin, sub_json, strict=False, verbose=False): print('Loading data') - # FIXME: preserve corners - Ads, b = loadc_Ads_b([fnin], corner=None, ico=True) + Ads, bs = loadc_Ads_bs([fnin], ico=True) print('Sub: %u rows' % len(Ads)) iold = instances(Ads) @@ -15,10 +14,10 @@ def gen_group(fnin, sub_json, strict=False, verbose=False): print("Sub: %u => %u names" % (len(names_old), len(names))) print('Sub: %u => %u instances' % (iold, instances(Ads))) - 
for row_ds, row_b in zip(Ads, b): - yield row_ds, [row_b for _ in range(4)] + for row_ds, row_bs in zip(Ads, bs): + yield row_ds, row_bs -def run(fns_in, fnout, sub_json, corner=None, strict=False, verbose=False): +def run(fns_in, fnout, sub_json, strict=False, verbose=False): with open(fnout, 'w') as fout: fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') for fn_in in fns_in: @@ -38,7 +37,6 @@ def main(): ) parser.add_argument('--verbose', action='store_true', help='') - parser.add_argument('--massage', action='store_true', help='') parser.add_argument('--strict', action='store_true', help='') parser.add_argument('--sub-csv', help='') parser.add_argument('--sub-json', required=True, help='Group substitutions to make fully ranked') diff --git a/fuzzers/007-timing/csv_group2flat.py b/fuzzers/007-timing/csv_group2flat.py index bf5c2870..2449b916 100644 --- a/fuzzers/007-timing/csv_group2flat.py +++ b/fuzzers/007-timing/csv_group2flat.py @@ -2,7 +2,7 @@ # https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html from scipy.optimize import linprog -from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json, A_ub_np2d, print_eqns, print_eqns_np, Ads2bounds, loadc_Ads_raw +from timfuz import Benchmark, loadc_Ads_bs, load_sub, Ads2bounds, corners2csv, corner_s2i from timfuz_massage import massage_equations import numpy as np import glob @@ -15,15 +15,13 @@ import datetime import os import time -def gen_flat(fnin, sub_json): - # FIXME: preserve all bounds - # Ads, bs = loadc_Ads_raw([csv_fn_in]) - Ads, b = loadc_Ads_b([fnin], corner=None, ico=True) - bounds = Ads2bounds(Ads, b) +def gen_flat(fnin, sub_json, corner=None): + Ads, bs = loadc_Ads_bs([fnin], ico=True) + bounds = Ads2bounds(Ads, bs) zeros = set() nonzeros = set() - for bound_name, bound_b in bounds.items(): + for bound_name, bound_bs in bounds.items(): sub = sub_json['subs'].get(bound_name, None) if sub: # put entire delay into pivot @@ -34,18 +32,23 @@ def gen_flat(fnin, sub_json): #for name in non_pivot: # assert name not in nonzeros, (pivot, name, nonzeros) zeros.update(non_pivot) - yield pivot, bound_b + yield pivot, bound_bs else: nonzeros.add(bound_name) - yield bound_name, bound_b + yield bound_name, bound_bs # non-pivots can appear multiple times, but they should always be zero # however, due to substitution limitations, just warn violations = zeros.intersection(nonzeros) if len(violations): print('WARNING: %s non-0 non-pivot' % (len(violations))) - for zero in zeros - violations: - yield zero, 0 + # XXX: how to best handle these? + # should they be fixed 0? 
+ if corner: + zero_row = [None, None, None, None] + zero_row[corner_s2i[corner]] = 0 + for zero in zeros - violations: + yield zero, zero_row def run(fnin, fnout, sub_json, corner=None, sort=False, verbose=False): if sort: @@ -55,10 +58,10 @@ def run(fnin, fnout, sub_json, corner=None, sort=False, verbose=False): with open(fnout, 'w') as fout: fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') - for name, delay in sortf(gen_flat(fnin, sub_json)): + #for name, corners in sortf(gen_flat(fnin, sub_json)): + for name, corners in gen_flat(fnin, sub_json, corner=corner): row_ico = 1 - corners = [delay for _ in range(4)] - items = [str(row_ico), ' '.join([str(x) for x in corners])] + items = [str(row_ico), corners2csv(corners)] items.append('%u %s' % (1, name)) fout.write(','.join(items) + '\n') @@ -74,6 +77,7 @@ def main(): parser.add_argument('--sort', action='store_true', help='') parser.add_argument('--sub-csv', help='') parser.add_argument('--sub-json', required=True, help='Group substitutions to make fully ranked') + parser.add_argument('--corner', default=None, help='') parser.add_argument('fnin', default=None, help='input timing delay .csv') parser.add_argument('fnout', default=None, help='output timing delay .csv') args = parser.parse_args() @@ -83,7 +87,7 @@ def main(): sub_json = load_sub(args.sub_json) try: - run(args.fnin, args.fnout, sub_json=sub_json, sort=args.sort, verbose=args.verbose) + run(args.fnin, args.fnout, sub_json=sub_json, sort=args.sort, verbose=args.verbose, corner=args.corner) finally: print('Exiting after %s' % bench) diff --git a/fuzzers/007-timing/projects/project.mk b/fuzzers/007-timing/projects/project.mk index f870af11..45a6165c 100644 --- a/fuzzers/007-timing/projects/project.mk +++ b/fuzzers/007-timing/projects/project.mk @@ -3,6 +3,7 @@ SPECIMENS := $(addprefix specimen_,$(shell seq -f '%03.0f' $(N))) SPECIMENS_OK := $(addsuffix /OK,$(SPECIMENS)) CSVS := $(addsuffix /timing3.csv,$(SPECIMENS)) TIMFUZ_DIR=$(XRAY_DIR)/fuzzers/007-timing +CORNER=slow_max all: build/tilea.json @@ -26,7 +27,7 @@ build/sub.json: $(SPECIMENS_OK) mkdir -p build # Discover which variables can be separated # This is typically the longest running operation - python3 $(TIMFUZ_DIR)/rref.py --simplify --out build/sub.json.tmp $(CSVS) + python3 $(TIMFUZ_DIR)/rref.py --corner $(CORNER) --simplify --out build/sub.json.tmp $(CSVS) mv build/sub.json.tmp build/sub.json build/grouped.csv: $(SPECIMENS_OK) build/sub.json @@ -41,17 +42,17 @@ build/checksub: build/grouped.csv build/sub.json build/leastsq.csv: build/sub.json build/grouped.csv build/checksub # Create a rough timing model that approximately fits the given paths - python3 $(TIMFUZ_DIR)/solve_leastsq.py --sub-json build/sub.json build/grouped.csv --out build/leastsq.csv.tmp + python3 $(TIMFUZ_DIR)/solve_leastsq.py --sub-json build/sub.json build/grouped.csv --corner $(CORNER) --out build/leastsq.csv.tmp mv build/leastsq.csv.tmp build/leastsq.csv build/linprog.csv: build/leastsq.csv build/grouped.csv # Tweak rough timing model, making sure all constraints are satisfied - python3 $(TIMFUZ_DIR)/solve_linprog.py --sub-json build/sub.json --sub-csv build/leastsq.csv --massage build/grouped.csv --out build/linprog.csv.tmp + python3 $(TIMFUZ_DIR)/solve_linprog.py --sub-json build/sub.json --sub-csv build/leastsq.csv --massage build/grouped.csv --corner $(CORNER) --out build/linprog.csv.tmp mv build/linprog.csv.tmp build/linprog.csv build/flat.csv: build/linprog.csv # Take separated variables and back-annotate them to the original 
timing variables - python3 $(TIMFUZ_DIR)/csv_group2flat.py --sub-json build/sub.json --sort build/linprog.csv build/flat.csv.tmp + python3 $(TIMFUZ_DIR)/csv_group2flat.py --sub-json build/sub.json --corner $(CORNER) --sort build/linprog.csv build/flat.csv.tmp mv build/flat.csv.tmp build/flat.csv build/tilea.json: build/flat.csv diff --git a/fuzzers/007-timing/solve_leastsq.py b/fuzzers/007-timing/solve_leastsq.py index bbb20ecc..10cacbe3 100644 --- a/fuzzers/007-timing/solve_leastsq.py +++ b/fuzzers/007-timing/solve_leastsq.py @@ -2,20 +2,16 @@ # https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html from scipy.optimize import linprog -from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json, A_ub_np2d, print_eqns, print_eqns_np -from timfuz_massage import massage_equations +from timfuz import Benchmark, load_sub, corner_s2i, acorner2csv +import timfuz import numpy as np import glob -import json import math -from collections import OrderedDict from fractions import Fraction import sys -import datetime import os import time import timfuz_solve -import numpy import scipy.optimize as optimize from scipy.optimize import least_squares @@ -37,10 +33,11 @@ def mkestimate(Anp, b): x0[coli] = min(x0[coli], ub) return x0 -def save(outfn, res, names): +def save(outfn, res, names, corner): # ballpark minimum actual observed delay is around 7 (carry chain) # anything less than one is probably a solver artifact delta = 0.5 + corneri = corner_s2i[corner] print('Writing results') skips = 0 @@ -59,14 +56,13 @@ def save(outfn, res, names): skips += 1 continue #xvali = round(xval) - xvali = math.ceil(xval) - corners = [xvali for _ in range(4)] - items = [str(row_ico), ' '.join([str(x) for x in corners])] + + items = [str(row_ico), acorner2csv(math.ceil(xval), corneri)] items.append('%u %s' % (1, name)) fout.write(','.join(items) + '\n') print('Wrote: skip %u => %u / %u valid delays' % (skips, len(names) - skips, len(names))) -def run_corner(Anp, b, names, verbose=False, opts={}, meta={}, outfn=None): +def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=None): # Given timing scores for above delays (-ps) assert type(Anp[0]) is np.ndarray, type(Anp[0]) @@ -135,7 +131,7 @@ def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=No print('Done') if outfn: - save(outfn, res, names) + save(outfn, res, names, corner) def main(): import argparse diff --git a/fuzzers/007-timing/solve_linprog.py b/fuzzers/007-timing/solve_linprog.py index c33cd34a..e8fa4ac1 100644 --- a/fuzzers/007-timing/solve_linprog.py +++ b/fuzzers/007-timing/solve_linprog.py @@ -2,21 +2,44 @@ # https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html from scipy.optimize import linprog -from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json, A_ub_np2d, print_eqns, print_eqns_np -from timfuz_massage import massage_equations +from timfuz import Benchmark, load_sub, A_ub_np2d, acorner2csv, corner_s2i import numpy as np import glob import json import math -from collections import OrderedDict -from fractions import Fraction import sys -import datetime import os import time import timfuz_solve -def run_corner(Anp, b, names, verbose=False, opts={}, meta={}, outfn=None): +def save(outfn, res, names, corner): + # ballpark minimum actual observed
delay is around 7 (carry chain) + # anything less than one is probably a solver artifact + delta = 0.5 + corneri = corner_s2i[corner] + + print('Writing results') + zeros = 0 + with open(outfn, 'w') as fout: + # write as one variable per line + # this natively forms a bound if fed into linprog solver + fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') + for xval, name in zip(res.x, names): + row_ico = 1 + + # FIXME: only report for the given corner? + # also review ceil vs floor choice for min vs max + # let's be more conservative for now + if xval < delta: + print('WARNING: near 0 delay on %s: %0.6f' % (name, xval)) + zeros += 1 + #continue + items = [str(row_ico), acorner2csv(math.ceil(xval), corneri)] + items.append('%u %s' % (1, name)) + fout.write(','.join(items) + '\n') + print('Wrote: zeros %u => %u / %u constrained delays' % (zeros, len(names) - zeros, len(names))) + +def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=None): # Given timing scores for above delays (-ps) assert type(Anp[0]) is np.ndarray, type(Anp[0]) assert type(b) is np.ndarray, type(b) @@ -41,12 +64,6 @@ def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=Non #A_ub = -1.0 * Anp A_ub = [-1.0 * x for x in Anp] - if verbose: - print('') - print('A_ub b_ub') - print_eqns_np(A_ub, b_ub, verbose=verbose) - print('') - print('Creating misc constants...') # Minimization function scalars # Treat all logic elements as equally important @@ -107,33 +124,7 @@ def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=Non if nonzero and (verbose or ((nonzeros < 100 or nonzeros % 20 == 0) and nonzeros <= plim)): print(' % 4u % -80s % 10.1f' % (xi, name, x)) print('Delay on %d / %d' % (nonzeros, len(res.x))) if outfn: - # ballpark minimum actual observed delay is around 7 (carry chain) - # anything less than one is probably a solver artifact - delta = 0.5 - - print('Writing resutls') - zeros = 0 - with open(outfn, 'w') as fout: - # write as one variable per line - # this natively forms a bound if fed into linprog solver - fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') - for xval, name in zip(res.x, names): - row_ico = 1 - - # FIXME: only report for the given corner?
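The run_corner docstring earlier in this file spells out the max-corner setup: each observed path contributes sum(delays) >= T, and since scipy's linprog only accepts A_ub x <= b_ub, both sides are negated; minimizing c = sum(x) then pulls every delay down onto the tightest constraints. A self-contained micro-example of the same formulation, with toy numbers and the stock solver:

    import numpy as np
    from scipy.optimize import linprog

    # observations: t0 + t1 >= 10, t1 + t2 >= 12, t0 >= 5
    A_ub = -np.array([[1, 1, 0], [0, 1, 1], [1, 0, 0]], dtype=float)
    b_ub = -np.array([10.0, 12.0, 5.0])
    c = np.ones(3)  # minimize the total assigned delay
    res = linprog(c, A_ub=A_ub, b_ub=b_ub, bounds=(0, None))
    print(res.x)  # one feasible optimum, e.g. t0=5, t1=5, t2=7

The 'max' in corner assertion added in a later patch flags that this formulation only covers the max corners; the min corners would presumably need the inequalities and objective flipped.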
- # also review ceil vs floor choice for min vs max - # lets be more conservative for now - if xval < delta: - print('WARNING: near 0 delay on %s: %0.6f' % (name, xval)) - zeros += 1 - #continue - #xvali = round(xval) - xvali = math.ceil(xval) - corners = [xvali for _ in range(4)] - items = [str(row_ico), ' '.join([str(x) for x in corners])] - items.append('%u %s' % (1, name)) - fout.write(','.join(items) + '\n') - print('Wrote: zeros %u => %u / %u constrained delays' % (zeros, len(names) - zeros, len(names))) + save(outfn, res, names, corner) def main(): import argparse @@ -147,7 +138,7 @@ def main(): parser.add_argument('--massage', action='store_true', help='') parser.add_argument('--sub-csv', help='') parser.add_argument('--sub-json', help='Group substitutions to make fully ranked') - parser.add_argument('--corner', default="slow_max", help='') + parser.add_argument('--corner', default=None, required=True, help='') parser.add_argument('--out', default=None, help='output timing delay .json') parser.add_argument( 'fns_in', diff --git a/fuzzers/007-timing/tile_annotate.py b/fuzzers/007-timing/tile_annotate.py index 005b6c52..5b897b4d 100644 --- a/fuzzers/007-timing/tile_annotate.py +++ b/fuzzers/007-timing/tile_annotate.py @@ -1,7 +1,7 @@ #!/usr/bin/env python3 import timfuz -from timfuz import loadc_Ads_b, Ads2bounds +from timfuz import loadc_Ads_bs, Ads2bounds import sys import os @@ -17,37 +17,41 @@ def run(fnin, fnout, tile_json_fn, verbose=False): tilej = json.load(open(tile_json_fn, 'r')) # FIXME: all corners - Ads, b = loadc_Ads_b([fnin], corner=None, ico=True) - bounds = Ads2bounds(Ads, b) + Ads, bs = loadc_Ads_bs([fnin], ico=True) + bounds = Ads2bounds(Ads, bs) pipn_net = 0 pipn_solved = [0, 0, 0, 0] + pipn_covered = [0, 0, 0, 0] wiren_net = 0 wiren_solved = [0, 0, 0, 0] + wiren_covered = [0, 0, 0, 0] for tile in tilej['tiles'].values(): pips = tile['pips'] for k, v in pips.items(): - val = bounds.get('PIP_' + v, None) - pips[k] = quad(val) + pips[k] = bounds.get('PIP_' + v, [None, None, None, None]) pipn_net += 1 for i in range(4): if pips[k][i]: pipn_solved[i] += 1 + if pips[k][i] is not None: + pipn_covered[i] += 1 wires = tile['wires'] for k, v in wires.items(): - val = bounds.get('WIRE_' + v, None) - wires[k] = quad(val) + wires[k] = bounds.get('WIRE_' + v, [None, None, None, None]) wiren_net += 1 for i in range(4): if wires[k][i]: wiren_solved[i] += 1 + if wires[k][i] is not None: + wiren_covered[i] += 1 for corner, corneri in timfuz.corner_s2i.items(): print('Corner %s' % corner) - print(' Pips: %u / %u solved' % (pipn_solved[corneri], pipn_net)) - print(' Wires: %u / %u solved' % (wiren_solved[corneri], wiren_net)) + print(' Pips: %u / %u solved, %u / %u covered' % (pipn_solved[corneri], pipn_net, pipn_covered[corneri], pipn_net)) + print(' Wires: %u / %u solved, %u / %u covered' % (wiren_solved[corneri], wiren_net, wiren_covered[corneri], wiren_net)) json.dump(tilej, open(fnout, 'w'), sort_keys=True, indent=4, separators=(',', ': ')) diff --git a/fuzzers/007-timing/timfuz.py b/fuzzers/007-timing/timfuz.py index 09b34da2..c20a1b57 100644 --- a/fuzzers/007-timing/timfuz.py +++ b/fuzzers/007-timing/timfuz.py @@ -530,7 +530,12 @@ def loadc_Ads_mkb(fns, mkb, filt): corners = cols[1] vars = cols[2:] - corners = [int(x) for x in corners.split()] + def mkcorner(bstr): + if bstr == 'None': + return None + else: + return int(bstr) + corners = [mkcorner(corner) for corner in corners.split()] def mkvar(x): i, var = x.split() return (var, int(i)) @@ -556,6 +561,16 @@ def 
loadc_Ads_b(fns, corner, ico=None): return val[corneri] return loadc_Ads_mkb(fns, mkb, filt) +def loadc_Ads_bs(fns, ico=None): + if ico is not None: + filt = lambda ico_, corners, vars: ico_ == ico + else: + filt = lambda ico_, corners, vars: True + + def mkb(val): + return val + return loadc_Ads_mkb(fns, mkb, filt) + def loadc_Ads_raw(fns): filt = lambda ico, corners, vars: True @@ -699,13 +714,13 @@ def print_eqns_np(A_ub, b_ub, verbose=0): Adi = A_ub_np2d(A_ub) print_eqns(Adi, b_ub, verbose=verbose) -def Ads2bounds(Ads, b): +def Ads2bounds(Ads, bs): ret = {} - for row_ds, row_b in zip(Ads, b): + for row_ds, row_bs in zip(Ads, bs): assert len(row_ds) == 1 k, v = list(row_ds.items())[0] assert v == 1 - ret[k] = row_b + ret[k] = row_bs return ret def instances(Ads): @@ -713,3 +728,13 @@ def instances(Ads): for row_ds in Ads: ret += sum(row_ds.values()) return ret + +def acorner2csv(b, corneri): + corners = ["None" for _ in range(4)] + corners[corneri] = str(b) + return ' '.join(corners) + +def corners2csv(bs): + assert len(bs) == 4 + corners = ["None" if b is None else str(b) for b in bs] + return ' '.join(corners) diff --git a/fuzzers/007-timing/timfuz_solve.py b/fuzzers/007-timing/timfuz_solve.py index c9af58b1..dd08c5e0 100644 --- a/fuzzers/007-timing/timfuz_solve.py +++ b/fuzzers/007-timing/timfuz_solve.py @@ -143,4 +143,4 @@ def run(fns_in, corner, run_corner, sub_json=None, sub_csv=None, dedup=True, mas print('Converting to numpy...') names, Anp = A_ds2np(Ads) - run_corner(Anp, np.asarray(b), names, outfn=outfn, verbose=verbose, **kwargs) + run_corner(Anp, np.asarray(b), names, corner, outfn=outfn, verbose=verbose, **kwargs) From 2dbe379200d6870178bf5087322b24f94cddb448 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Tue, 11 Sep 2018 19:47:31 -0700 Subject: [PATCH 41/55] timfuz: corner FIXME assert Signed-off-by: John McMaster --- fuzzers/007-timing/solve_linprog.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/fuzzers/007-timing/solve_linprog.py b/fuzzers/007-timing/solve_linprog.py index e8fa4ac1..037cafe2 100644 --- a/fuzzers/007-timing/solve_linprog.py +++ b/fuzzers/007-timing/solve_linprog.py @@ -57,6 +57,8 @@ def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=Non -delay1 + -delay2 + -delay4 <= -timing1 -delay2 + -delay3 <= -timing2 ''' + assert 'max' in corner, 'FIXME: support min corner math' + rows = len(Anp) cols = len(Anp[0]) print('Scaling to solution form...') From e148ed5f9128a98fad4c549fd0e9cf3f1968651a Mon Sep 17 00:00:00 2001 From: John McMaster Date: Wed, 12 Sep 2018 13:51:44 -0700 Subject: [PATCH 42/55] timfuz: build all four corners Signed-off-by: John McMaster --- fuzzers/007-timing/projects/corner.mk | 42 ++++++++++++++++++++++ fuzzers/007-timing/projects/project.mk | 49 +++++++++++++------------- fuzzers/007-timing/solve_linprog.py | 12 +++++-- fuzzers/007-timing/timfuz.py | 6 ++++ fuzzers/007-timing/timfuz_solve.py | 9 +++-- 5 files changed, 89 insertions(+), 29 deletions(-) create mode 100644 fuzzers/007-timing/projects/corner.mk diff --git a/fuzzers/007-timing/projects/corner.mk b/fuzzers/007-timing/projects/corner.mk new file mode 100644 index 00000000..c4ac2d23 --- /dev/null +++ b/fuzzers/007-timing/projects/corner.mk @@ -0,0 +1,42 @@ +# Run corner specific calculations + +TIMFUZ_DIR=$(XRAY_DIR)/fuzzers/007-timing +CORNER=slow_max + +all: build/$(CORNER)/tilea.json + +run: + $(MAKE) clean + $(MAKE) all + touch run.ok + +clean: + rm -rf specimen_[0-9][0-9][0-9]/ seg_clblx.segbits __pycache__ run.ok + rm -rf vivado*.log 
vivado_*.str vivado*.jou design *.bits *.dcp *.bit + rm -rf build + +.PHONY: all run clean + +build/$(CORNER): + mkdir build/$(CORNER) + +build/$(CORNER)/leastsq.csv: build/sub.json build/grouped.csv build/checksub build/$(CORNER) + # Create a rough timing model that approximately fits the given paths + python3 $(TIMFUZ_DIR)/solve_leastsq.py --sub-json build/sub.json build/grouped.csv --corner $(CORNER) --out build/$(CORNER)/leastsq.csv.tmp + mv build/$(CORNER)/leastsq.csv.tmp build/$(CORNER)/leastsq.csv + +build/$(CORNER)/linprog.csv: build/$(CORNER)/leastsq.csv build/grouped.csv + # Tweak rough timing model, making sure all constraints are satisfied + python3 $(TIMFUZ_DIR)/solve_linprog.py --sub-json build/sub.json --sub-csv build/$(CORNER)/leastsq.csv --massage build/grouped.csv --corner $(CORNER) --out build/$(CORNER)/linprog.csv.tmp + mv build/$(CORNER)/linprog.csv.tmp build/$(CORNER)/linprog.csv + +build/$(CORNER)/flat.csv: build/$(CORNER)/linprog.csv + # Take separated variables and back-annotate them to the original timing variables + python3 $(TIMFUZ_DIR)/csv_group2flat.py --sub-json build/sub.json --corner $(CORNER) --sort build/$(CORNER)/linprog.csv build/$(CORNER)/flat.csv.tmp + mv build/$(CORNER)/flat.csv.tmp build/$(CORNER)/flat.csv + +build/$(CORNER)/tilea.json: build/$(CORNER)/flat.csv + # Final processing + # Insert timing delays into actual tile layouts + python3 $(TIMFUZ_DIR)/tile_annotate.py --tile-json $(TIMFUZ_DIR)/timgrid/build/timgrid.json build/$(CORNER)/flat.csv build/$(CORNER)/tilea.json + diff --git a/fuzzers/007-timing/projects/project.mk b/fuzzers/007-timing/projects/project.mk index 45a6165c..c0b3d1a3 100644 --- a/fuzzers/007-timing/projects/project.mk +++ b/fuzzers/007-timing/projects/project.mk @@ -1,11 +1,30 @@ +# project.mk: build specimens (run vivado), compute rref +# corner.mk: run corner specific calculations + N := 1 SPECIMENS := $(addprefix specimen_,$(shell seq -f '%03.0f' $(N))) SPECIMENS_OK := $(addsuffix /OK,$(SPECIMENS)) CSVS := $(addsuffix /timing3.csv,$(SPECIMENS)) TIMFUZ_DIR=$(XRAY_DIR)/fuzzers/007-timing -CORNER=slow_max +RREF_CORNER=slow_max -all: build/tilea.json +TILEA_JSONS=build/fast_max/tilea.json build/fast_min/tilea.json build/slow_max/tilea.json build/slow_min/tilea.json + +all: $(TILEA_JSONS) + +# make build/checksub first +build/fast_max/tilea.json: build/checksub + $(MAKE) -f $(TIMFUZ_DIR)/projects/corner.mk CORNER=fast_max +build/fast_min/tilea.json: build/checksub + $(MAKE) -f $(TIMFUZ_DIR)/projects/corner.mk CORNER=fast_min +build/slow_max/tilea.json: build/checksub + $(MAKE) -f $(TIMFUZ_DIR)/projects/corner.mk CORNER=slow_max +build/slow_min/tilea.json: build/checksub + $(MAKE) -f $(TIMFUZ_DIR)/projects/corner.mk CORNER=slow_min +fast_max: build/fast_max/tilea.json +fast_min: build/fast_min/tilea.json +slow_max: build/slow_max/tilea.json +slow_min: build/slow_min/tilea.json $(SPECIMENS_OK): bash generate.sh $(subst /OK,,$@) @@ -21,13 +40,15 @@ clean: rm -rf vivado*.log vivado_*.str vivado*.jou design *.bits *.dcp *.bit rm -rf build -.PHONY: database pushdb run clean +.PHONY: all run clean + +# rref should be the same regardless of corner build/sub.json: $(SPECIMENS_OK) mkdir -p build # Discover which variables can be separated # This is typically the longest running operation - python3 $(TIMFUZ_DIR)/rref.py --corner $(CORNER) --simplify --out build/sub.json.tmp $(CSVS) + python3 $(TIMFUZ_DIR)/rref.py --corner $(RREF_CORNER) --simplify --out build/sub.json.tmp $(CSVS) mv build/sub.json.tmp build/sub.json build/grouped.csv: 
$(SPECIMENS_OK) build/sub.json @@ -40,23 +61,3 @@ build/checksub: build/grouped.csv build/sub.json python3 $(TIMFUZ_DIR)/checksub.py --sub-json build/sub.json build/grouped.csv touch build/checksub -build/leastsq.csv: build/sub.json build/grouped.csv build/checksub - # Create a rough timing model that approximately fits the given paths - python3 $(TIMFUZ_DIR)/solve_leastsq.py --sub-json build/sub.json build/grouped.csv --corner $(CORNER) --out build/leastsq.csv.tmp - mv build/leastsq.csv.tmp build/leastsq.csv - -build/linprog.csv: build/leastsq.csv build/grouped.csv - # Tweak rough timing model, making sure all constraints are satisfied - python3 $(TIMFUZ_DIR)/solve_linprog.py --sub-json build/sub.json --sub-csv build/leastsq.csv --massage build/grouped.csv --corner $(CORNER) --out build/linprog.csv.tmp - mv build/linprog.csv.tmp build/linprog.csv - -build/flat.csv: build/linprog.csv - # Take separated variables and back-annotate them to the original timing variables - python3 $(TIMFUZ_DIR)/csv_group2flat.py --sub-json build/sub.json --corner $(CORNER) --sort build/linprog.csv build/flat.csv.tmp - mv build/flat.csv.tmp build/flat.csv - -build/tilea.json: build/flat.csv - # Final processing - # Insert timing delays into actual tile layouts - python3 $(TIMFUZ_DIR)/tile_annotate.py --tile-json $(TIMFUZ_DIR)/timgrid/build/timgrid.json build/flat.csv build/tilea.json - diff --git a/fuzzers/007-timing/solve_linprog.py b/fuzzers/007-timing/solve_linprog.py index 037cafe2..9c943ecb 100644 --- a/fuzzers/007-timing/solve_linprog.py +++ b/fuzzers/007-timing/solve_linprog.py @@ -12,7 +12,7 @@ import os import time import timfuz_solve -def save(outfn, res, names, corner): +def save(outfn, xvals, names, corner): # ballpark minimum actual observed delay is around 7 (carry chain) # anything less than one is probably a solver artifact delta = 0.5 @@ -24,7 +24,7 @@ def save(outfn, res, names, corner): # write as one variable per line # this natively forms a bound if fed into linprog solver fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') - for xval, name in zip(res.x, names): + for xval, name in zip(xvals, names): row_ico = 1 # FIXME: only report for the given corner? 
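As a reference for the four-corner CSV format that save() writes above: each row
stores the fast_max/fast_min/slow_max/slow_min values as a space separated list,
with the literal string "None" marking corners that have no data. A minimal
standalone sketch of the round trip (csv2corners is a name invented here for
illustration; the patch itself uses corners2csv and the mkcorner helper inside
loadc_Ads_mkb):

    def corners2csv(bs):
        # serialize the four corner values, None -> "None"
        assert len(bs) == 4
        return ' '.join('None' if b is None else str(b) for b in bs)

    def csv2corners(s):
        # inverse direction, mirroring mkcorner() in loadc_Ads_mkb
        return [None if x == 'None' else int(x) for x in s.split()]

    assert corners2csv([None, None, 93, None]) == 'None None 93 None'
    assert csv2corners('None None 93 None') == [None, None, 93, None]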
@@ -40,6 +40,12 @@ def save(outfn, res, names, corner): print('Wrote: zeros %u => %u / %u constrained delays' % (zeros, len(names) - zeros, len(names))) def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=None): + if len(Anp) == 0: + print('WARNING: zero equations') + if outfn: + save(outfn, [], [], corner) + return + # Given timing scores for above delays (-ps) assert type(Anp[0]) is np.ndarray, type(Anp[0]) assert type(b) is np.ndarray, type(b) @@ -126,7 +132,7 @@ def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=Non print('Delay on %d / %d' % (nonzeros, len(res.x))) if outfn: - save(outfn, res, names, corner) + save(outfn, res.x, names, corner) def main(): import argparse diff --git a/fuzzers/007-timing/timfuz.py b/fuzzers/007-timing/timfuz.py index c20a1b57..c0d0aad2 100644 --- a/fuzzers/007-timing/timfuz.py +++ b/fuzzers/007-timing/timfuz.py @@ -37,6 +37,10 @@ corner_s2i = OrderedDict([ ('slow_min', 3), ]) +# Equations are filtered out until nothing is left +class SimplifiedToZero(Exception): + pass + def print_eqns(A_ubd, b_ub, verbose=0, lim=3, label=''): rows = len(b_ub) @@ -172,6 +176,8 @@ def simplify_rows(Ads, b_ub, remove_zd=False, corner=None): eqns[rowt] = minmax(eqns.get(rowt, 0), b) print(' done') + if len(eqns) == 0: + raise SimplifiedToZero() #A_ub_ret = eqns.keys() A_ubd_ret, b_ub_ret = Ab_ub_dt2d(eqns) diff --git a/fuzzers/007-timing/timfuz_solve.py b/fuzzers/007-timing/timfuz_solve.py index dd08c5e0..47373411 100644 --- a/fuzzers/007-timing/timfuz_solve.py +++ b/fuzzers/007-timing/timfuz_solve.py @@ -2,7 +2,7 @@ # https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html from scipy.optimize import linprog -from timfuz import Benchmark, Ar_di2np, Ar_ds2t, A_di2ds, A_ds2di, simplify_rows, loadc_Ads_b, index_names, A_ds2np, load_sub, run_sub_json, A_ub_np2d, print_eqns, print_eqns_np, Ads2bounds, instances +from timfuz import Benchmark, simplify_rows, loadc_Ads_b, index_names, A_ds2np, run_sub_json, print_eqns, Ads2bounds, instances, SimplifiedToZero from timfuz_massage import massage_equations import numpy as np import glob @@ -139,7 +139,12 @@ def run(fns_in, corner, run_corner, sub_json=None, sub_csv=None, dedup=True, mas This creates derived constraints to provide more realistic results ''' if massage: - Ads, b = massage_equations(Ads, b, corner=corner) + try: + Ads, b = massage_equations(Ads, b, corner=corner) + except SimplifiedToZero: + print('WARNING: simplified to zero equations') + Ads = [] + b = [] print('Converting to numpy...') names, Anp = A_ds2np(Ads) From 2ad0bf82fc9ca382136232a26e5775777c8bfff9 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Wed, 12 Sep 2018 14:03:33 -0700 Subject: [PATCH 43/55] timfuz: ALLOW_ZERO_EQN Signed-off-by: John McMaster --- fuzzers/007-timing/projects/corner.mk | 6 +++++- fuzzers/007-timing/projects/oneblinkw/Makefile | 2 ++ fuzzers/007-timing/projects/project.mk | 1 + fuzzers/007-timing/timfuz_solve.py | 2 ++ 4 files changed, 10 insertions(+), 1 deletion(-) diff --git a/fuzzers/007-timing/projects/corner.mk b/fuzzers/007-timing/projects/corner.mk index c4ac2d23..5ae80ca8 100644 --- a/fuzzers/007-timing/projects/corner.mk +++ b/fuzzers/007-timing/projects/corner.mk @@ -2,6 +2,7 @@ TIMFUZ_DIR=$(XRAY_DIR)/fuzzers/007-timing CORNER=slow_max +ALLOW_ZERO_EQN?=N all: build/$(CORNER)/tilea.json @@ -20,6 +21,9 @@ clean: build/$(CORNER): mkdir build/$(CORNER) +build/checksub: + false + build/$(CORNER)/leastsq.csv: build/sub.json build/grouped.csv 
build/checksub build/$(CORNER) # Create a rough timing model that approximately fits the given paths python3 $(TIMFUZ_DIR)/solve_leastsq.py --sub-json build/sub.json build/grouped.csv --corner $(CORNER) --out build/$(CORNER)/leastsq.csv.tmp @@ -27,7 +31,7 @@ build/$(CORNER)/leastsq.csv: build/sub.json build/grouped.csv build/checksub bui build/$(CORNER)/linprog.csv: build/$(CORNER)/leastsq.csv build/grouped.csv # Tweak rough timing model, making sure all constraints are satisfied - python3 $(TIMFUZ_DIR)/solve_linprog.py --sub-json build/sub.json --sub-csv build/$(CORNER)/leastsq.csv --massage build/grouped.csv --corner $(CORNER) --out build/$(CORNER)/linprog.csv.tmp + ALLOW_ZERO_EQN=$(ALLOW_ZERO_EQN) python3 $(TIMFUZ_DIR)/solve_linprog.py --sub-json build/sub.json --sub-csv build/$(CORNER)/leastsq.csv --massage build/grouped.csv --corner $(CORNER) --out build/$(CORNER)/linprog.csv.tmp mv build/$(CORNER)/linprog.csv.tmp build/$(CORNER)/linprog.csv build/$(CORNER)/flat.csv: build/$(CORNER)/linprog.csv diff --git a/fuzzers/007-timing/projects/oneblinkw/Makefile b/fuzzers/007-timing/projects/oneblinkw/Makefile index 9c8b1947..5e5721b7 100644 --- a/fuzzers/007-timing/projects/oneblinkw/Makefile +++ b/fuzzers/007-timing/projects/oneblinkw/Makefile @@ -1,2 +1,4 @@ +# so simple that likely no linprog adjustments will be needed +ALLOW_ZERO_EQN?=Y include ../project.mk diff --git a/fuzzers/007-timing/projects/project.mk b/fuzzers/007-timing/projects/project.mk index c0b3d1a3..daa79aeb 100644 --- a/fuzzers/007-timing/projects/project.mk +++ b/fuzzers/007-timing/projects/project.mk @@ -7,6 +7,7 @@ SPECIMENS_OK := $(addsuffix /OK,$(SPECIMENS)) CSVS := $(addsuffix /timing3.csv,$(SPECIMENS)) TIMFUZ_DIR=$(XRAY_DIR)/fuzzers/007-timing RREF_CORNER=slow_max +ALLOW_ZERO_EQN?=N TILEA_JSONS=build/fast_max/tilea.json build/fast_min/tilea.json build/slow_max/tilea.json build/slow_min/tilea.json diff --git a/fuzzers/007-timing/timfuz_solve.py b/fuzzers/007-timing/timfuz_solve.py index 47373411..ccd2b738 100644 --- a/fuzzers/007-timing/timfuz_solve.py +++ b/fuzzers/007-timing/timfuz_solve.py @@ -142,6 +142,8 @@ def run(fns_in, corner, run_corner, sub_json=None, sub_csv=None, dedup=True, mas try: Ads, b = massage_equations(Ads, b, corner=corner) except SimplifiedToZero: + if os.getenv('ALLOW_ZERO_EQN', 'N') != 'Y': + raise print('WARNING: simplified to zero equations') Ads = [] b = [] From c965288e75888615b22e7613ad5b52a6caf61880 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Wed, 12 Sep 2018 15:14:18 -0700 Subject: [PATCH 44/55] timfuz: min corner tweaks Signed-off-by: John McMaster --- fuzzers/007-timing/solve_leastsq.py | 32 ++++++++++++++++----------- fuzzers/007-timing/solve_linprog.py | 2 +- fuzzers/007-timing/timfuz.py | 13 ++++++++++- fuzzers/007-timing/timfuz_massage.py | 4 +++- fuzzers/007-timing/timfuz_solve.py | 33 ++++++++++++++++++++++------ 5 files changed, 61 insertions(+), 23 deletions(-) diff --git a/fuzzers/007-timing/solve_leastsq.py b/fuzzers/007-timing/solve_leastsq.py index 10cacbe3..5bdd4fad 100644 --- a/fuzzers/007-timing/solve_leastsq.py +++ b/fuzzers/007-timing/solve_leastsq.py @@ -33,34 +33,44 @@ def mkestimate(Anp, b): x0[coli] = min(x0[coli], ub) return x0 -def save(outfn, res, names, corner): +def save(outfn, xvals, names, corner): # ballpark minimum actual observed delay is around 7 (carry chain) # anything less than one is probably a solver artifact delta = 0.5 corneri = corner_s2i[corner] - print('Writing resutls') + # Round conservatively + roundf = { + 'fast_max': math.ceil, + 
'fast_min': math.floor, + 'slow_max': math.ceil, + 'slow_min': math.floor, + }[corner] + + print('Writing results') skips = 0 + keeps = 0 with open(outfn, 'w') as fout: # write as one variable per line # this natively forms a bound if fed into linprog solver fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') - for xval, name in zip(res.x, names): + for xval, name in zip(xvals, names): row_ico = 1 - # FIXME: only report for the given corner? # also review ceil vs floor choice for min vs max # lets be more conservative for now if xval < delta: #print('Skipping %s: %0.6f' % (name, xval)) skips += 1 continue + keeps += 1 #xvali = round(xval) - items = [str(row_ico), acorner2csv(math.ceil(xval), corneri)] + items = [str(row_ico), acorner2csv(roundf(xval), corneri)] items.append('%u %s' % (1, name)) fout.write(','.join(items) + '\n') - print('Wrote: skip %u => %u / %u valid delays' % (skips, len(names) - skips, len(names))) + print('Wrote: skip %u => %u / %u valid delays' % (skips, keeps, len(names))) + assert keeps, 'Failed to estimate delay' def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=None): # Given timing scores for above delays (-ps) @@ -131,7 +141,7 @@ def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=Non print('Done') if outfn: - save(outfn, res, names, corner) + save(outfn, res.x, names, corner) def main(): import argparse @@ -148,23 +158,19 @@ def main(): parser.add_argument('--out', default=None, help='output timing delay .json') parser.add_argument( 'fns_in', - nargs='*', + nargs='+', help='timing3.csv input files') args = parser.parse_args() # Store options in dict to ease passing through functions bench = Benchmark() - fns_in = args.fns_in - if not fns_in: - fns_in = glob.glob('specimen_*/timing3.csv') - sub_json = None if args.sub_json: sub_json = load_sub(args.sub_json) try: timfuz_solve.run(run_corner=run_corner, sub_json=sub_json, - fns_in=fns_in, corner=args.corner, massage=args.massage, outfn=args.out, verbose=args.verbose) + fns_in=args.fns_in, corner=args.corner, massage=args.massage, outfn=args.out, verbose=args.verbose) finally: print('Exiting after %s' % bench) diff --git a/fuzzers/007-timing/solve_linprog.py b/fuzzers/007-timing/solve_linprog.py index 9c943ecb..e10ce7fb 100644 --- a/fuzzers/007-timing/solve_linprog.py +++ b/fuzzers/007-timing/solve_linprog.py @@ -18,7 +18,7 @@ def save(outfn, xvals, names, corner): delta = 0.5 corneri = corner_s2i[corner] - print('Writing resutls') + print('Writing results') zeros = 0 with open(outfn, 'w') as fout: # write as one variable per line diff --git a/fuzzers/007-timing/timfuz.py b/fuzzers/007-timing/timfuz.py index c0d0aad2..c1ed1bb7 100644 --- a/fuzzers/007-timing/timfuz.py +++ b/fuzzers/007-timing/timfuz.py @@ -41,6 +41,10 @@ corner_s2i = OrderedDict([ class SimplifiedToZero(Exception): pass + +def allow_zero_eqns(): + return os.getenv('ALLOW_ZERO_EQN', 'N') == 'Y' + def print_eqns(A_ubd, b_ub, verbose=0, lim=3, label=''): rows = len(b_ub) @@ -147,6 +151,13 @@ def simplify_rows(Ads, b_ub, remove_zd=False, corner=None): 'slow_max': max, 'slow_min': min, }[corner] + # An outlier to make unknown values be ignored + T_UNK = { + 'fast_max': 0, + 'fast_min': 10e9, + 'slow_max': 0, + 'slow_min': 10e9, + }[corner] sys.stdout.write('SimpR ') sys.stdout.flush() @@ -173,7 +184,7 @@ def simplify_rows(Ads, b_ub, remove_zd=False, corner=None): continue rowt = Ar_ds2t(rowd) - eqns[rowt] = minmax(eqns.get(rowt, 0), b) + eqns[rowt] = minmax(eqns.get(rowt, T_UNK), b) 
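To make the dedup rule above concrete, here is a toy run for the slow_max
corner, where duplicate paths keep their largest observed delay and T_UNK = 0
acts as the identity (element names and delays invented for illustration):

    minmax, T_UNK = max, 0  # slow_max corner
    eqns = {}
    for rowt, b in [(('A', 'B'), 10), (('A', 'B'), 12), (('C',), 7)]:
        eqns[rowt] = minmax(eqns.get(rowt, T_UNK), b)
    assert eqns == {('A', 'B'): 12, ('C',): 7}

For a min corner the same loop runs with minmax = min and a huge T_UNK, so a
path seen for the first time never wins against real data.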
print(' done') if len(eqns) == 0: diff --git a/fuzzers/007-timing/timfuz_massage.py b/fuzzers/007-timing/timfuz_massage.py index e35f4e28..1f52af5b 100644 --- a/fuzzers/007-timing/timfuz_massage.py +++ b/fuzzers/007-timing/timfuz_massage.py @@ -80,8 +80,8 @@ def derive_eq_by_row(Ads, b, verbose=0, col_lim=0, tweak=False): How to do this in a reasonable time span? Also equations are sparse, which makes this harder to compute ''' + assert len(Ads) == len(b), 'Ads, b length mismatch' rows = len(Ads) - assert rows == len(b) # Index equations into hash maps so can lookup sparse elements quicker assert len(Ads) == len(b) @@ -403,6 +403,8 @@ def massage_equations_inc_col_lim(Ads, b, verbose=False, corner=None): Remove these columns as necessary to speed up solving ''' + assert len(Ads) == len(b), 'Ads, b length mismatch' + def debug(what): if verbose: print('') diff --git a/fuzzers/007-timing/timfuz_solve.py b/fuzzers/007-timing/timfuz_solve.py index ccd2b738..52a4c43e 100644 --- a/fuzzers/007-timing/timfuz_solve.py +++ b/fuzzers/007-timing/timfuz_solve.py @@ -2,7 +2,7 @@ # https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html from scipy.optimize import linprog -from timfuz import Benchmark, simplify_rows, loadc_Ads_b, index_names, A_ds2np, run_sub_json, print_eqns, Ads2bounds, instances, SimplifiedToZero +from timfuz import Benchmark, simplify_rows, loadc_Ads_b, index_names, A_ds2np, run_sub_json, print_eqns, Ads2bounds, instances, SimplifiedToZero, allow_zero_eqns from timfuz_massage import massage_equations import numpy as np import glob @@ -68,15 +68,30 @@ def check_feasible(A_ub, b_ub): raise Exception("Bad ") print(' done') -def filter_bounds(Ads, b, bounds): +def filter_bounds(Ads, b, bounds, corner): '''Given min variable delays, remove rows that won't constrain solution''' + #assert len(bounds) > 0 + + if 'max' in corner: + # Keep delays possibly larger than current bound + def keep(row_b, est): + return row_b > est + T_UNK = 0 + elif 'min' in corner: + # Keep delays possibly smaller than current bound + def keep(row_b, est): + return row_b < est + T_UNK = 1e9 + else: + assert 0 + ret_Ads = [] ret_b = [] for row_ds, row_b in zip(Ads, b): # some variables get estimated at 0 - est = sum([bounds.get(k, 0) * v for k, v in row_ds.items()]) + est = sum([bounds.get(k, T_UNK) * v for k, v in row_ds.items()]) # will this row potentially constrain us more? 
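A worked example of the bound filter above, with invented element names and
delays: suppose the current estimates are A=5 and B=7, and a measured path
crosses A twice and B once with a total delay of 20.

    bounds = {'A': 5, 'B': 7}
    row_ds, row_b = {'A': 2, 'B': 1}, 20

    est = sum(bounds.get(k, 0) * v for k, v in row_ds.items())  # 2*5 + 1*7 = 17

    # max corner: row_b > est (20 > 17), so some element on this path must be
    # slower than currently estimated and the row is kept; a min corner keeps
    # only rows with row_b < est, and its large T_UNK default ensures rows
    # containing still-unknown elements are never filtered out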
- if row_b > est: + if keep(row_b, est): ret_Ads.append(row_ds) ret_b.append(row_b) return ret_Ads, ret_b @@ -114,11 +129,14 @@ def run(fns_in, corner, run_corner, sub_json=None, sub_csv=None, dedup=True, mas if sub_csv: Ads2, b2 = loadc_Ads_b([sub_csv], corner, ico=True) bounds = Ads2bounds(Ads2, b2) + assert len(bounds), 'Failed to load bounds' rows_old = len(Ads) - Ads, b = filter_bounds(Ads, b, bounds) - print('Filter bounds: %s => %s rows' % (rows_old, len(Ads))) + Ads, b = filter_bounds(Ads, b, bounds, corner) + print('Filter bounds: %s => %s + %s rows' % (rows_old, len(Ads), len(Ads2))) Ads = Ads + Ads2 b = b + b2 + assert len(Ads) or allow_zero_eqns() + assert len(Ads) == len(b), 'Ads, b length mismatch' if verbose: print @@ -126,6 +144,7 @@ def run(fns_in, corner, run_corner, sub_json=None, sub_csv=None, dedup=True, mas #print #col_dist(A_ubd, 'final', names) + print('b10', b[0:100]) ''' Given: @@ -142,7 +161,7 @@ def run(fns_in, corner, run_corner, sub_json=None, sub_csv=None, dedup=True, mas try: Ads, b = massage_equations(Ads, b, corner=corner) except SimplifiedToZero: - if os.getenv('ALLOW_ZERO_EQN', 'N') != 'Y': + if not allow_zero_eqns(): raise print('WARNING: simplified to zero equations') Ads = [] From 0b3aa34b5b111d56c7c153f59c5327331e9dcd4e Mon Sep 17 00:00:00 2001 From: John McMaster Date: Wed, 12 Sep 2018 15:29:32 -0700 Subject: [PATCH 45/55] timfuz: fully support min corner Signed-off-by: John McMaster --- fuzzers/007-timing/solve_linprog.py | 60 ++++++++++++++++++++++------- 1 file changed, 46 insertions(+), 14 deletions(-) diff --git a/fuzzers/007-timing/solve_linprog.py b/fuzzers/007-timing/solve_linprog.py index e10ce7fb..ee73a702 100644 --- a/fuzzers/007-timing/solve_linprog.py +++ b/fuzzers/007-timing/solve_linprog.py @@ -18,6 +18,13 @@ def save(outfn, xvals, names, corner): delta = 0.5 corneri = corner_s2i[corner] + roundf = { + 'fast_max': math.ceil, + 'fast_min': math.floor, + 'slow_max': math.ceil, + 'slow_min': math.floor, + }[corner] + print('Writing results') zeros = 0 with open(outfn, 'w') as fout: @@ -34,10 +41,11 @@ def save(outfn, xvals, names, corner): print('WARNING: near 0 delay on %s: %0.6f' % (name, xval)) zeros += 1 #continue - items = [str(row_ico), acorner2csv(math.ceil(xval), corneri)] + items = [str(row_ico), acorner2csv(roundf(xval), corneri)] items.append('%u %s' % (1, name)) fout.write(','.join(items) + '\n') - print('Wrote: zeros %u => %u / %u constrained delays' % (zeros, len(names) - zeros, len(names))) + nonzeros = len(names) - zeros + print('Wrote: %u / %u constrained delays, %u zeros' % (nonzeros, len(names), zeros)) def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=None): if len(Anp) == 0: @@ -45,6 +53,12 @@ def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=Non if outfn: save(outfn, [], [], corner) return + maxcorner = { + 'slow_max': True, + 'slow_min': False, + 'fast_max': True, + 'fast_min': False, + }[corner] # Given timing scores for above delays (-ps) assert type(Anp[0]) is np.ndarray, type(Anp[0]) @@ -54,28 +68,46 @@ def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=Non ''' Be mindful of signs - Have something like - timing1/timing 2 are constants - delay1 + delay2 + delay4 >= timing1 - delay2 + delay3 >= timing2 + t1, t2: total delay contants + d1, d2..: variables to solve for + + Max corner intuitive form: + d1 + d2 + d4 >= t1 + d2 + d3 >= t2 But need it in compliant form: - -delay1 + -delay2 + -delay4 <= -timing1 - -delay2 + -delay3 <= 
-timing2 + -d1 + -d2 + -d4 <= -t1 + -d2 + -d3 <= -t2 + Minimize delay elements + + + Min corner intuitive form: + d1 + d2 + d4 <= t1 + d2 + d3 <= t2 + Maximize delay elements ''' - assert 'max' in corner, 'FIXME: support min corner math' rows = len(Anp) cols = len(Anp[0]) - print('Scaling to solution form...') - b_ub = -1.0 * b - #A_ub = -1.0 * Anp - A_ub = [-1.0 * x for x in Anp] + if maxcorner: + print('maxcorner => scaling to solution form...') + b_ub = -1.0 * b + #A_ub = -1.0 * Anp + A_ub = [-1.0 * x for x in Anp] + else: + print('mincorner => no scaling required') + b_ub = b + A_ub = Anp print('Creating misc constants...') # Minimization function scalars # Treat all logic elements as equally important - c = [1 for _i in range(len(names))] + if maxcorner: + # Best result are min delays + c = [1 for _i in range(len(names))] + else: + # Best result are max delays + c = [-1 for _i in range(len(names))] # Delays cannot be negative # (this is also the default constraint) #bounds = [(0, None) for _i in range(len(names))] From 2a28dabf02a2585b326e2e4d7883c112186d895b Mon Sep 17 00:00:00 2001 From: John McMaster Date: Wed, 12 Sep 2018 17:14:19 -0700 Subject: [PATCH 46/55] timfuz: ALLOW_ZERO_EQN workaround for projects that fail PnR Signed-off-by: John McMaster --- fuzzers/007-timing/projects/corner.mk | 1 + fuzzers/007-timing/projects/project.mk | 22 ++++++++++++++++++---- fuzzers/007-timing/rref.py | 2 +- fuzzers/007-timing/timfuz.py | 8 ++------ 4 files changed, 22 insertions(+), 11 deletions(-) diff --git a/fuzzers/007-timing/projects/corner.mk b/fuzzers/007-timing/projects/corner.mk index 5ae80ca8..aaa3cbf2 100644 --- a/fuzzers/007-timing/projects/corner.mk +++ b/fuzzers/007-timing/projects/corner.mk @@ -3,6 +3,7 @@ TIMFUZ_DIR=$(XRAY_DIR)/fuzzers/007-timing CORNER=slow_max ALLOW_ZERO_EQN?=N +BADPRJ_OK?=N all: build/$(CORNER)/tilea.json diff --git a/fuzzers/007-timing/projects/project.mk b/fuzzers/007-timing/projects/project.mk index daa79aeb..691bb048 100644 --- a/fuzzers/007-timing/projects/project.mk +++ b/fuzzers/007-timing/projects/project.mk @@ -8,6 +8,7 @@ CSVS := $(addsuffix /timing3.csv,$(SPECIMENS)) TIMFUZ_DIR=$(XRAY_DIR)/fuzzers/007-timing RREF_CORNER=slow_max ALLOW_ZERO_EQN?=N +BADPRJ_OK?=N TILEA_JSONS=build/fast_max/tilea.json build/fast_min/tilea.json build/slow_max/tilea.json build/slow_min/tilea.json @@ -28,7 +29,7 @@ slow_max: build/slow_max/tilea.json slow_min: build/slow_min/tilea.json $(SPECIMENS_OK): - bash generate.sh $(subst /OK,,$@) + bash generate.sh $(subst /OK,,$@) || (if [ "$(BADPRJ_OK)" != 'Y' ] ; then exit 1; fi; exit 0) touch $@ run: @@ -43,18 +44,31 @@ clean: .PHONY: all run clean -# rref should be the same regardless of corner +# Normally require all projects to complete +# If BADPRJ_OK is allowed, only take projects that were successful +# FIXME: couldn't get call to work +exist_csvs = \ + for f in $(CSVS); do \ + if [ "$(BADPRJ_OK)" != 'Y' -o -f $$f ] ; then \ + echo $$f; \ + fi; \ + done +# rref should be the same regardless of corner build/sub.json: $(SPECIMENS_OK) mkdir -p build # Discover which variables can be separated # This is typically the longest running operation - python3 $(TIMFUZ_DIR)/rref.py --corner $(RREF_CORNER) --simplify --out build/sub.json.tmp $(CSVS) + \ + csvs=$$(for f in $(CSVS); do if [ "$(BADPRJ_OK)" != 'Y' -o -f $$f ] ; then echo $$f; fi; done) ; \ + python3 $(TIMFUZ_DIR)/rref.py --corner $(RREF_CORNER) --simplify --out build/sub.json.tmp $$csvs mv build/sub.json.tmp build/sub.json build/grouped.csv: $(SPECIMENS_OK) 
build/sub.json # Separate variables - python3 $(TIMFUZ_DIR)/csv_flat2group.py --sub-json build/sub.json --strict --out build/grouped.csv.tmp $(CSVS) + \ + csvs=$$(for f in $(CSVS); do if [ "$(BADPRJ_OK)" != 'Y' -o -f $$f ] ; then echo $$f; fi; done) ; \ + python3 $(TIMFUZ_DIR)/csv_flat2group.py --sub-json build/sub.json --strict --out build/grouped.csv.tmp $$csvs mv build/grouped.csv.tmp build/grouped.csv build/checksub: build/grouped.csv build/sub.json diff --git a/fuzzers/007-timing/rref.py b/fuzzers/007-timing/rref.py index 4cf1b9e7..bad37401 100644 --- a/fuzzers/007-timing/rref.py +++ b/fuzzers/007-timing/rref.py @@ -221,7 +221,7 @@ def main(): parser.add_argument('--out', help='Output sub.json substitution result') parser.add_argument( 'fns_in', - nargs='*', + nargs='+', help='timing3.txt input files') args = parser.parse_args() bench = Benchmark() diff --git a/fuzzers/007-timing/timfuz.py b/fuzzers/007-timing/timfuz.py index c1ed1bb7..6287cce2 100644 --- a/fuzzers/007-timing/timfuz.py +++ b/fuzzers/007-timing/timfuz.py @@ -187,15 +187,11 @@ def simplify_rows(Ads, b_ub, remove_zd=False, corner=None): eqns[rowt] = minmax(eqns.get(rowt, T_UNK), b) print(' done') + + print('Simplify rows: %d => %d rows w/ zd %d, ze %d' % (len(b_ub), len(eqns), zero_ds, zero_es)) if len(eqns) == 0: raise SimplifiedToZero() - - #A_ub_ret = eqns.keys() A_ubd_ret, b_ub_ret = Ab_ub_dt2d(eqns) - - print('Simplify rows: %d => %d rows w/ zd %d, ze %d' % (len(b_ub), len(b_ub_ret), zero_ds, zero_es)) - #return A_ub_ret, b_ub_ret - #return A_ub_np2d(A_ub_ret), b_ub_ret return A_ubd_ret, b_ub_ret def A_ubr_np2d(row): From c104e70724e43f2b715021609b50d15d08f1f45b Mon Sep 17 00:00:00 2001 From: John McMaster Date: Wed, 12 Sep 2018 18:30:09 -0700 Subject: [PATCH 47/55] timfuz: combine tile process corners Signed-off-by: John McMaster --- fuzzers/007-timing/Makefile | 29 +++++- fuzzers/007-timing/README.md | 12 +-- fuzzers/007-timing/projects/project.mk | 5 +- fuzzers/007-timing/tile_combine.py | 123 +++++++++++++++++++++++++ 4 files changed, 154 insertions(+), 15 deletions(-) create mode 100644 fuzzers/007-timing/tile_combine.py diff --git a/fuzzers/007-timing/Makefile b/fuzzers/007-timing/Makefile index 1f90909f..40e42a35 100644 --- a/fuzzers/007-timing/Makefile +++ b/fuzzers/007-timing/Makefile @@ -1,5 +1,26 @@ -all: - cd speed && make - cd timgrid && make - cd projects && make +# for now hammering on just picorv32 +# consider instead aggregating multiple projects +PRJ?=picorv32 +PRJN?=8 + +all: build/tilea.json + +clean: + rm -rf build + cd speed && $(MAKE) clean + cd timgrid && $(MAKE) clean + cd projects && $(MAKE) clean + +speed/build/speed.json: + cd speed && $(MAKE) + +timgrid/build/timgrid.json: + cd timgrid && $(MAKE) + +build/tilea.json: projects/$(PRJ)/build/tilea.json + mkdir -p build + cp projects/$(PRJ)/build/tilea.json build/tilea.json + +projects/$(PRJ)/build/tilea.json: speed/build/speed.json timgrid/build/timgrid.json + cd projects/$(PRJ) && $(MAKE) N=$(PRJN) diff --git a/fuzzers/007-timing/README.md b/fuzzers/007-timing/README.md index 047e073c..a7c79eb2 100644 --- a/fuzzers/007-timing/README.md +++ b/fuzzers/007-timing/README.md @@ -13,19 +13,11 @@ Currently this document focuses exclusively on fabric timing delays. 
## Quick start ``` -pushd speed make -popd - -pushd timgrid -make -popd - -pushd projects/placelut -make N=1 -popd ``` +This will take a relatively long time (say 45 min) and generate build/tilea.json + ## Vivado background diff --git a/fuzzers/007-timing/projects/project.mk b/fuzzers/007-timing/projects/project.mk index 691bb048..7e2b4f1f 100644 --- a/fuzzers/007-timing/projects/project.mk +++ b/fuzzers/007-timing/projects/project.mk @@ -12,7 +12,7 @@ BADPRJ_OK?=N TILEA_JSONS=build/fast_max/tilea.json build/fast_min/tilea.json build/slow_max/tilea.json build/slow_min/tilea.json -all: $(TILEA_JSONS) +all: build/tilea.json # make build/checksub first build/fast_max/tilea.json: build/checksub @@ -76,3 +76,6 @@ build/checksub: build/grouped.csv build/sub.json python3 $(TIMFUZ_DIR)/checksub.py --sub-json build/sub.json build/grouped.csv touch build/checksub +build/tilea.json: $(TILEA_JSONS) + python3 $(TIMFUZ_DIR)/tile_combine.py --out build/tilea.json $(TILEA_JSONS) + diff --git a/fuzzers/007-timing/tile_combine.py b/fuzzers/007-timing/tile_combine.py new file mode 100644 index 00000000..35ea2291 --- /dev/null +++ b/fuzzers/007-timing/tile_combine.py @@ -0,0 +1,123 @@ +#!/usr/bin/env python3 + +import sys +import os +import time +import json +from collections import OrderedDict + +corner_s2i = OrderedDict([ + ('fast_max', 0), + ('fast_min', 1), + ('slow_max', 2), + ('slow_min', 3), + ]) + +corner2minmax = { + 'fast_max': max, + 'fast_min': min, + 'slow_max': max, + 'slow_min': min, + } + +def build_tilejo(fnins): + ''' + { + "tiles": { + "BRKH_B_TERM_INT": { + "pips": {}, + "wires": { + "B_TERM_UTURN_INT_ER1BEG0": [ + null, + null, + 93, + null + ], + ''' + + tilejo = {"tiles": {}} + for fnin in fnins: + tileji = json.load(open(fnin, 'r')) + for tilek, tilevi in tileji['tiles'].items(): + # No previous data? 
Copy + tilevo = tilejo['tiles'].get(tilek, None) + if tilevo is None: + tilejo['tiles'][tilek] = tilevi + # Otherwise combine + else: + def process_type(etype): + for pipk, pipvi in tilevi[etype].items(): + pipvo = tilevo[etype][pipk] + for cornerk, corneri in corner_s2i.items(): + cornervo = pipvo[corneri] + cornervi = pipvi[corneri] + # no new data + if cornervi is None: + pass + # no previous data + elif cornervo is None: + pipvo[corneri] = cornervi + # combine + else: + minmax = corner2minmax[cornerk] + pipvo[corneri] = minmax(cornervi, cornervo) + process_type('pips') + process_type('wires') + return tilejo + +def check_corner_minmax(tilej, verbose=False): + # Post processing pass looking for min/max inconsistencies + # Especially an issue due to complexities around under-constrained elements + # (ex: pivots set to 0 delay) + print('Checking for min/max consistency') + checks = 0 + bad = 0 + for tilev in tilej['tiles'].values(): + def process_type(etype): + nonlocal checks + nonlocal bad + + for pipk, pipv in tilev[etype].items(): + for corner in ('slow', 'fast'): + mini = corner_s2i[corner + '_min'] + minv = pipv[mini] + maxi = corner_s2i[corner + '_max'] + maxv = pipv[maxi] + if minv is not None and maxv is not None: + checks += 1 + if minv > maxv: + if verbose: + print('WARNING: element %s %s min/max adjusted on corner %s' % (etype, pipk, corner)) + bad += 1 + pipv[mini] = maxv + pipv[maxi] = minv + + process_type('pips') + process_type('wires') + print('minmax: %u / %u bad' % (bad, checks)) + +def check_corners_minmax(tilej, verbose=False): + # TODO: check fast vs slow + pass + +def run(fnins, fnout, verbose=False): + tilejo = build_tilejo(fnins) + check_corner_minmax(tilejo) + check_corners_minmax(tilejo) + json.dump(tilejo, open(fnout, 'w'), sort_keys=True, indent=4, separators=(',', ': ')) + +def main(): + import argparse + + parser = argparse.ArgumentParser( + description= + 'Combine multiple tile corners into one .json file' + ) + parser.add_argument('--out', required=True, help='Combined .json file') + parser.add_argument('fnins', nargs='+', help='Input .json files') + args = parser.parse_args() + + run(args.fnins, args.out, verbose=False) + +if __name__ == '__main__': + main() From 12978f8051161be1b90e2b2912a54b09c3b34421 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Mon, 17 Sep 2018 11:15:42 -0700 Subject: [PATCH 48/55] timfuz: pep8 reformat Signed-off-by: John McMaster --- fuzzers/007-timing/benchmark.py | 20 +-- fuzzers/007-timing/checksub.py | 25 ++-- fuzzers/007-timing/corner_csv.py | 18 ++- fuzzers/007-timing/csv_flat2group.py | 26 ++-- fuzzers/007-timing/csv_group2flat.py | 22 ++- fuzzers/007-timing/node_unique.py | 35 ++--- fuzzers/007-timing/perf_test.py | 37 +++-- fuzzers/007-timing/pip_unique.py | 45 +++---- .../007-timing/projects/placelut/generate.py | 23 ++-- .../projects/placelut_fb/generate.py | 24 ++-- .../projects/placelut_ff_fb/generate.py | 27 ++-- fuzzers/007-timing/rref.py | 44 +++--- fuzzers/007-timing/solve_leastsq.py | 42 +++--- fuzzers/007-timing/solve_linprog.py | 59 +++++--- fuzzers/007-timing/speed/speed_json.py | 40 +++--- fuzzers/007-timing/sub2csv.py | 16 ++- fuzzers/007-timing/tile_annotate.py | 25 +++- fuzzers/007-timing/tile_combine.py | 39 ++++-- fuzzers/007-timing/timfuz.py | 126 +++++++++++++----- fuzzers/007-timing/timfuz_massage.py | 32 +++-- fuzzers/007-timing/timfuz_solve.py | 38 +++++- fuzzers/007-timing/timgrid/tile_txt2json.py | 32 +++-- fuzzers/007-timing/timing_txt2csv.py | 77 +++++++---- fuzzers/007-timing/wire_unique.py 
| 51 +++---- 24 files changed, 586 insertions(+), 337 deletions(-) diff --git a/fuzzers/007-timing/benchmark.py b/fuzzers/007-timing/benchmark.py index 6da3e132..39a6e797 100644 --- a/fuzzers/007-timing/benchmark.py +++ b/fuzzers/007-timing/benchmark.py @@ -6,6 +6,7 @@ Copyright 2010 John McMaster import time + def time_str(delta): fraction = delta % 1 delta -= fraction @@ -17,11 +18,12 @@ def time_str(delta): hours = delta return '%02d:%02d:%02d.%04d' % (hours, minutes, seconds, fraction * 10000) + class Benchmark: start_time = None end_time = None - - def __init__(self, max_items = None): + + def __init__(self, max_items=None): # For the lazy self.start_time = time.time() self.end_time = None @@ -35,19 +37,19 @@ class Benchmark: def stop(self): self.end_time = time.time() - - def advance(self, n = 1): + + def advance(self, n=1): self.cur_items += n def set_cur_items(self, n): self.cur_items = n - - def delta_s(self): + + def delta_s(self): if self.end_time: return self.end_time - self.start_time else: return time.time() - self.start_time - + def __str__(self): if self.end_time: return time_str(self.end_time - self.start_time) @@ -65,7 +67,7 @@ class Benchmark: eta_str = time_str(remaining) else: eta_str = "indeterminate" - return '%d / %d, ETA: %s @ %s' % (self.cur_items, self.max_items, eta_str, rate_s) + return '%d / %d, ETA: %s @ %s' % ( + self.cur_items, self.max_items, eta_str, rate_s) else: return time_str(time.time() - self.start_time) - diff --git a/fuzzers/007-timing/checksub.py b/fuzzers/007-timing/checksub.py index 00559735..7a307e14 100644 --- a/fuzzers/007-timing/checksub.py +++ b/fuzzers/007-timing/checksub.py @@ -8,6 +8,7 @@ import math from collections import OrderedDict from fractions import Fraction + def Adi2matrix_random(A_ubd, b_ub, names): # random assignment # was making some empty rows @@ -24,6 +25,7 @@ def Adi2matrix_random(A_ubd, b_ub, names): b_ret[dst_rowi] += b return A_ret, b_ret + def Ads2matrix_linear(Ads, b): names, Adi = A_ds2di(Ads) cols = len(names) @@ -41,16 +43,19 @@ def Ads2matrix_linear(Ads, b): dst_rowi = (dst_rowi + 1) % rows_out return A_ret, b_ret + def pmatrix(Anp, s): import sympy msym = sympy.Matrix(Anp) print(s) sympy.pprint(msym) + def pds(Ads, s): names, Anp = A_ds2np(Ads) pmatrix(Anp, s) - print('Names: %s' % (names,)) + print('Names: %s' % (names, )) + def run(fns_in, sub_json=None, verbose=False): # arbitrary...data is thrown away @@ -76,7 +81,6 @@ def run(fns_in, sub_json=None, verbose=False): # A_ub2, b_ub2 = Adi2matrix_random(A_ubd, b, names) Amat, _bmat = Ads2matrix_linear(Ads, b) #pmatrix(Amat, 'Matrix') - ''' The matrix must be fully ranked to even be considered reasonable Even then, floating point error *possibly* could make it fully ranked, although probably not since we have whole numbers @@ -96,22 +100,19 @@ def run(fns_in, sub_json=None, verbose=False): else: print('slogdet :) : %s, %s' % (sign, logdet)) if rank != len(names): - raise Exception("Matrix not fully ranked w/ %u / %u" % (rank, len(names))) + raise Exception( + "Matrix not fully ranked w/ %u / %u" % (rank, len(names))) + def main(): import argparse parser = argparse.ArgumentParser( - description= - 'Check sub.json solution feasibility' - ) + description='Check sub.json solution feasibility') parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--sub-json', help='') - parser.add_argument( - 'fns_in', - nargs='*', - help='timing3.csv input files') + parser.add_argument('fns_in', nargs='*', help='timing3.csv input files') args = 
parser.parse_args() # Store options in dict to ease passing through functions bench = Benchmark() @@ -125,10 +126,10 @@ def main(): sub_json = load_sub(args.sub_json) try: - run(sub_json=sub_json, - fns_in=fns_in, verbose=args.verbose) + run(sub_json=sub_json, fns_in=fns_in, verbose=args.verbose) finally: print('Exiting after %s' % bench) + if __name__ == '__main__': main() diff --git a/fuzzers/007-timing/corner_csv.py b/fuzzers/007-timing/corner_csv.py index d64c64ab..429e1e55 100644 --- a/fuzzers/007-timing/corner_csv.py +++ b/fuzzers/007-timing/corner_csv.py @@ -3,6 +3,7 @@ from timfuz import Benchmark, simplify_rows, loadc_Ads_b import glob + def run(fout, fns_in, corner, verbose=0): Ads, b = loadc_Ads_b(fns_in, corner, ico=True) Ads, b = simplify_rows(Ads, b, corner=corner) @@ -18,22 +19,19 @@ def run(fout, fns_in, corner, verbose=0): items.append('%u %s' % (v, k)) fout.write(','.join(items) + '\n') + def main(): import argparse parser = argparse.ArgumentParser( - description= - 'Create a .csv with a single process corner' - ) + description='Create a .csv with a single process corner') parser.add_argument('--verbose', type=int, help='') - parser.add_argument('--auto-name', action='store_true', help='timing3.csv => timing3c.csv') + parser.add_argument( + '--auto-name', action='store_true', help='timing3.csv => timing3c.csv') parser.add_argument('--out', default=None, help='Output csv') parser.add_argument('--corner', help='Output csv') - parser.add_argument( - 'fns_in', - nargs='*', - help='timing3.csv input files') + parser.add_argument('fns_in', nargs='*', help='timing3.csv input files') args = parser.parse_args() bench = Benchmark() @@ -53,8 +51,8 @@ def main(): if not fns_in: fns_in = glob.glob('specimen_*/timing3.csv') - run(fout=fout, - fns_in=fns_in, corner=args.corner, verbose=args.verbose) + run(fout=fout, fns_in=fns_in, corner=args.corner, verbose=args.verbose) + if __name__ == '__main__': main() diff --git a/fuzzers/007-timing/csv_flat2group.py b/fuzzers/007-timing/csv_flat2group.py index f1398b87..4cde0e61 100644 --- a/fuzzers/007-timing/csv_flat2group.py +++ b/fuzzers/007-timing/csv_flat2group.py @@ -2,6 +2,7 @@ from timfuz import Benchmark, loadc_Ads_bs, index_names, load_sub, run_sub_json, instances + def gen_group(fnin, sub_json, strict=False, verbose=False): print('Loading data') Ads, bs = loadc_Ads_bs([fnin], ico=True) @@ -17,6 +18,7 @@ def gen_group(fnin, sub_json, strict=False, verbose=False): for row_ds, row_bs in zip(Ads, bs): yield row_ds, row_bs + def run(fns_in, fnout, sub_json, strict=False, verbose=False): with open(fnout, 'w') as fout: fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') @@ -28,23 +30,21 @@ def run(fns_in, fnout, sub_json, strict=False, verbose=False): items.append('%u %s' % (v, k)) fout.write(','.join(items) + '\n') + def main(): import argparse - parser = argparse.ArgumentParser( - description= - 'Solve timing solution' - ) + parser = argparse.ArgumentParser(description='Solve timing solution') parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--strict', action='store_true', help='') parser.add_argument('--sub-csv', help='') - parser.add_argument('--sub-json', required=True, help='Group substitutions to make fully ranked') - parser.add_argument('--out', help='Output sub.json substitution result') parser.add_argument( - 'fns_in', - nargs='*', - help='timing3.txt input files') + '--sub-json', + required=True, + help='Group substitutions to make fully ranked') + parser.add_argument('--out', 
help='Output sub.json substitution result') + parser.add_argument('fns_in', nargs='*', help='timing3.txt input files') args = parser.parse_args() # Store options in dict to ease passing through functions bench = Benchmark() @@ -52,9 +52,15 @@ def main(): sub_json = load_sub(args.sub_json) try: - run(args.fns_in, args.out, sub_json=sub_json, strict=args.strict, verbose=args.verbose) + run( + args.fns_in, + args.out, + sub_json=sub_json, + strict=args.strict, + verbose=args.verbose) finally: print('Exiting after %s' % bench) + if __name__ == '__main__': main() diff --git a/fuzzers/007-timing/csv_group2flat.py b/fuzzers/007-timing/csv_group2flat.py index 2449b916..438be40e 100644 --- a/fuzzers/007-timing/csv_group2flat.py +++ b/fuzzers/007-timing/csv_group2flat.py @@ -15,6 +15,7 @@ import datetime import os import time + def gen_flat(fnin, sub_json, corner=None): Ads, bs = loadc_Ads_bs([fnin], ico=True) bounds = Ads2bounds(Ads, bs) @@ -50,6 +51,7 @@ def gen_flat(fnin, sub_json, corner=None): for zero in zeros - violations: yield zero, zero_row + def run(fnin, fnout, sub_json, corner=None, sort=False, verbose=False): if sort: sortf = sorted @@ -65,18 +67,19 @@ def run(fnin, fnout, sub_json, corner=None, sort=False, verbose=False): items.append('%u %s' % (1, name)) fout.write(','.join(items) + '\n') + def main(): import argparse - parser = argparse.ArgumentParser( - description= - 'Solve timing solution' - ) + parser = argparse.ArgumentParser(description='Solve timing solution') parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--sort', action='store_true', help='') parser.add_argument('--sub-csv', help='') - parser.add_argument('--sub-json', required=True, help='Group substitutions to make fully ranked') + parser.add_argument( + '--sub-json', + required=True, + help='Group substitutions to make fully ranked') parser.add_argument('--corner', default=None, help='') parser.add_argument('fnin', default=None, help='input timing delay .csv') parser.add_argument('fnout', default=None, help='output timing delay .csv') @@ -87,9 +90,16 @@ def main(): sub_json = load_sub(args.sub_json) try: - run(args.fnin, args.fnout, sub_json=sub_json, sort=args.sort, verbose=args.verbose, corner=args.corner) + run( + args.fnin, + args.fnout, + sub_json=sub_json, + sort=args.sort, + verbose=args.verbose, + corner=args.corner) finally: print('Exiting after %s' % bench) + if __name__ == '__main__': main() diff --git a/fuzzers/007-timing/node_unique.py b/fuzzers/007-timing/node_unique.py index e5793e64..83b054b9 100644 --- a/fuzzers/007-timing/node_unique.py +++ b/fuzzers/007-timing/node_unique.py @@ -4,6 +4,7 @@ Verifies that node timing info is unique import re + def gen_nodes(fin): for l in fin: lj = {} @@ -22,8 +23,9 @@ def gen_nodes(fin): if name in ('COST_CODE', 'SPEED_CLASS'): value = int(value) lj[name] = value - - tile_type, xy, wname = re.match(r'(.*)_(X[0-9]*Y[0-9]*)/(.*)', lj['NAME']).groups() + + tile_type, xy, wname = re.match( + r'(.*)_(X[0-9]*Y[0-9]*)/(.*)', lj['NAME']).groups() lj['tile_type'] = tile_type lj['xy'] = xy lj['wname'] = wname @@ -32,10 +34,12 @@ def gen_nodes(fin): yield lj + def run(node_fin, verbose=0): refnodes = {} nodei = 0 for nodei, anode in enumerate(gen_nodes(node_fin)): + def getk(anode): return anode['wname'] #return (anode['tile_type'], anode['wname']) @@ -52,22 +56,28 @@ def run(node_fin, verbose=0): # Verify equivilence for k in ( 'SPEED_CLASS', - - 'COST_CODE', 'COST_CODE_NAME', - 'IS_BAD', 'IS_COMPLETE', 'IS_GND', 'IS_VCC', - ): + 'COST_CODE', 
+ 'COST_CODE_NAME', + 'IS_BAD', + 'IS_COMPLETE', + 'IS_GND', + 'IS_VCC', + ): if k in refnode and k in anode: + def fail(): print 'Mismatch on %s' % k print refnode[k], anode[k] print refnode['l'] print anode['l'] #assert 0 + if k == 'SPEED_CLASS': # Parameters known to effect SPEED_CLASS # Verify at least one parameter is different if refnode[k] != anode[k]: - for k2 in ('IS_PIN', 'IS_INPUT_PIN', 'IS_OUTPUT_PIN', 'PIN_WIRE', 'NUM_WIRES'): + for k2 in ('IS_PIN', 'IS_INPUT_PIN', 'IS_OUTPUT_PIN', + 'PIN_WIRE', 'NUM_WIRES'): if refnode[k2] != anode[k2]: break else: @@ -81,19 +91,14 @@ def run(node_fin, verbose=0): elif k in refnode or k in anode: assert 0 + if __name__ == '__main__': import argparse - parser = argparse.ArgumentParser( - description= - 'Timing fuzzer' - ) + parser = argparse.ArgumentParser(description='Timing fuzzer') parser.add_argument('--verbose', type=int, help='') parser.add_argument( - 'node_fn_in', - default='/dev/stdin', - nargs='?', - help='Input file') + 'node_fn_in', default='/dev/stdin', nargs='?', help='Input file') args = parser.parse_args() run(open(args.node_fn_in, 'r'), verbose=args.verbose) diff --git a/fuzzers/007-timing/perf_test.py b/fuzzers/007-timing/perf_test.py index df1998a8..cb400809 100644 --- a/fuzzers/007-timing/perf_test.py +++ b/fuzzers/007-timing/perf_test.py @@ -1,5 +1,4 @@ #!/usr/bin/env python3 - ''' Triaging tool to help understand where we need more timing coverage Finds correlated variables to help make better test cases @@ -16,6 +15,7 @@ from fractions import Fraction import random from sympy import Rational + def intr(r): DELTA = 0.0001 @@ -25,24 +25,30 @@ def intr(r): assert abs(xi - x) < DELTA r[i] = xi + def fracr(r): intr(r) return [Fraction(x) for x in r] + def fracm(m): return [fracr(r) for r in m] + def symratr(r): intr(r) return [Rational(x) for x in r] + def symratm(m): return [symratr(r) for r in m] + def intm(m): [intr(r) for r in m] return m + def create_matrix(rows, cols): ret = np.zeros((rows, cols)) for rowi in range(rows): @@ -50,6 +56,7 @@ def create_matrix(rows, cols): ret[rowi][coli] = random.randint(1, 10) return ret + def create_matrix_sparse(rows, cols): ret = np.zeros((rows, cols)) for rowi in range(rows): @@ -58,7 +65,14 @@ def create_matrix_sparse(rows, cols): ret[rowi][coli] = random.randint(1, 10) return ret -def run(rows=35, cols=200, verbose=False, encoding='np', sparse=False, normalize_last=True): + +def run( + rows=35, + cols=200, + verbose=False, + encoding='np', + sparse=False, + normalize_last=True): random.seed(0) if sparse: mnp = create_matrix_sparse(rows, cols) @@ -85,7 +99,9 @@ def run(rows=35, cols=200, verbose=False, encoding='np', sparse=False, normalize print('Matrix') sympy.pprint(msym) - print('%s matrix, %u rows x %u cols, sparse: %s, normlast: %s' % (encoding, len(mnp), len(mnp[0]), sparse, normalize_last)) + print( + '%s matrix, %u rows x %u cols, sparse: %s, normlast: %s' % + (encoding, len(mnp), len(mnp[0]), sparse, normalize_last)) bench = Benchmark() try: rref, pivots = msym.rref(normalize_last=normalize_last) @@ -99,13 +115,11 @@ def run(rows=35, cols=200, verbose=False, encoding='np', sparse=False, normalize print('rref') sympy.pprint(rref) + def main(): import argparse - parser = argparse.ArgumentParser( - description= - 'Timing fuzzer' - ) + parser = argparse.ArgumentParser(description='Timing fuzzer') parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--sparse', action='store_true', help='') @@ -115,7 +129,14 @@ def main(): 
parser.add_argument('--encoding', default='np', help='') args = parser.parse_args() - run(encoding=args.encoding, rows=args.rows, cols=args.cols, sparse=args.sparse, normalize_last=bool(args.normalize_last), verbose=args.verbose) + run( + encoding=args.encoding, + rows=args.rows, + cols=args.cols, + sparse=args.sparse, + normalize_last=bool(args.normalize_last), + verbose=args.verbose) + if __name__ == '__main__': main() diff --git a/fuzzers/007-timing/pip_unique.py b/fuzzers/007-timing/pip_unique.py index 39b45d44..b38c9f4e 100644 --- a/fuzzers/007-timing/pip_unique.py +++ b/fuzzers/007-timing/pip_unique.py @@ -4,6 +4,7 @@ Verifies that node timing info is unique import re + def gen_wires(fin): for l in fin: lj = {} @@ -12,7 +13,8 @@ def gen_wires(fin): name, value = kvs.split(':') lj[name] = value - tile_type, xy, wname = re.match(r'(.*)_(X[0-9]*Y[0-9]*)/(.*)', lj['NAME']).groups() + tile_type, xy, wname = re.match( + r'(.*)_(X[0-9]*Y[0-9]*)/(.*)', lj['NAME']).groups() lj['tile_type'] = tile_type lj['xy'] = xy lj['wname'] = wname @@ -21,10 +23,12 @@ def gen_wires(fin): yield lj + def run(node_fin, verbose=0): refnodes = {} nodei = 0 for nodei, anode in enumerate(gen_wires(node_fin)): + def getk(anode): return anode['wname'] return (anode['tile_type'], anode['wname']) @@ -39,29 +43,29 @@ def run(node_fin, verbose=0): refnodes[getk(anode)] = anode continue k_invariant = ( - 'CAN_INVERT', - 'IS_BUFFERED_2_0', - 'IS_BUFFERED_2_1', - 'IS_DIRECTIONAL', - 'IS_EXCLUDED_PIP', - 'IS_FIXED_INVERSION', - 'IS_INVERTED', - 'IS_PSEUDO', - 'IS_SITE_PIP', - 'IS_TEST_PIP', - ) - k_varies = ( - 'TILE', - ) + 'CAN_INVERT', + 'IS_BUFFERED_2_0', + 'IS_BUFFERED_2_1', + 'IS_DIRECTIONAL', + 'IS_EXCLUDED_PIP', + 'IS_FIXED_INVERSION', + 'IS_INVERTED', + 'IS_PSEUDO', + 'IS_SITE_PIP', + 'IS_TEST_PIP', + ) + k_varies = ('TILE', ) # Verify equivilence for k in k_invariant: if k in refnode and k in anode: + def fail(): print 'Mismatch on %s' % k print refnode[k], anode[k] print refnode['l'] print anode['l'] #assert 0 + if refnode[k] != anode[k]: print fail() @@ -71,19 +75,14 @@ def run(node_fin, verbose=0): elif k not in k_varies: assert 0 + if __name__ == '__main__': import argparse - parser = argparse.ArgumentParser( - description= - 'Timing fuzzer' - ) + parser = argparse.ArgumentParser(description='Timing fuzzer') parser.add_argument('--verbose', type=int, help='') parser.add_argument( - 'node_fn_in', - default='/dev/stdin', - nargs='?', - help='Input file') + 'node_fn_in', default='/dev/stdin', nargs='?', help='Input file') args = parser.parse_args() run(open(args.node_fn_in, 'r'), verbose=args.verbose) diff --git a/fuzzers/007-timing/projects/placelut/generate.py b/fuzzers/007-timing/projects/placelut/generate.py index a56d4c55..68687f91 100644 --- a/fuzzers/007-timing/projects/placelut/generate.py +++ b/fuzzers/007-timing/projects/placelut/generate.py @@ -6,7 +6,6 @@ parser = argparse.ArgumentParser(description='') parser.add_argument('--sdx', default='8', help='') parser.add_argument('--sdy', default='4', help='') args = parser.parse_args() - ''' Generate in pairs Fill up switchbox quad for now @@ -26,15 +25,16 @@ nin = 6 * nlut nout = nlut print('//placelut simple') -print('//SBASE: %s' % (SBASE,)) -print('//SDX: %s' % (SDX,)) -print('//SDY: %s' % (SDX,)) -print('//nlut: %s' % (nlut,)) -print('''\ +print('//SBASE: %s' % (SBASE, )) +print('//SDX: %s' % (SDX, )) +print('//SDY: %s' % (SDX, )) +print('//nlut: %s' % (nlut, )) +print( + '''\ module roi ( input wire clk, input wire [%u:0] ins, - output wire [%u:0] 
outs);''') % (nin - 1, nout -1) + output wire [%u:0] outs);''') % (nin - 1, nout - 1) ini = 0 outi = 0 @@ -43,7 +43,8 @@ for lutx in xrange(SBASE[0], SBASE[0] + SDX): loc = "SLICE_X%uY%u" % (lutx, luty) for belc in 'ABCD': bel = '%c6LUT' % belc - print('''\ + print( + '''\ (* KEEP, DONT_TOUCH, LOC="%s", BEL="%s" *) LUT6 #( @@ -54,12 +55,13 @@ for lutx in xrange(SBASE[0], SBASE[0] + SDX): .I%u(ins[%u]),''' % (i, ini)) ini += 1 print('''\ - .O(outs[%u]));''') % (outi,) + .O(outs[%u]));''') % (outi, ) outi += 1 assert nin == ini assert nout == outi -print(''' +print( + ''' endmodule module top(input wire clk, input wire stb, input wire di, output wire do); @@ -88,4 +90,3 @@ module top(input wire clk, input wire stb, input wire di, output wire do); .outs(dout) ); endmodule''') % (nin, nout) - diff --git a/fuzzers/007-timing/projects/placelut_fb/generate.py b/fuzzers/007-timing/projects/placelut_fb/generate.py index 7e973da0..8f22dd37 100644 --- a/fuzzers/007-timing/projects/placelut_fb/generate.py +++ b/fuzzers/007-timing/projects/placelut_fb/generate.py @@ -1,5 +1,4 @@ #!/usr/bin/env python - ''' Note: vivado will (by default) fail bitgen DRC on LUT feedback loops Looks like can probably be disabled, but we actually don't need a bitstream for timing analysis @@ -14,7 +13,6 @@ parser = argparse.ArgumentParser(description='') parser.add_argument('--sdx', default='8', help='') parser.add_argument('--sdy', default='4', help='') args = parser.parse_args() - ''' Generate in pairs Fill up switchbox quad for now @@ -34,15 +32,16 @@ nin = 6 * nlut nout = nlut print('//placelut w/ feedback') -print('//SBASE: %s' % (SBASE,)) -print('//SDX: %s' % (SDX,)) -print('//SDY: %s' % (SDX,)) -print('//nlut: %s' % (nlut,)) -print('''\ +print('//SBASE: %s' % (SBASE, )) +print('//SDX: %s' % (SDX, )) +print('//SDY: %s' % (SDX, )) +print('//nlut: %s' % (nlut, )) +print( + '''\ module roi ( input wire clk, input wire [%u:0] ins, - output wire [%u:0] outs);''') % (nin - 1, nout -1) + output wire [%u:0] outs);''') % (nin - 1, nout - 1) ini = 0 outi = 0 @@ -51,7 +50,8 @@ for lutx in xrange(SBASE[0], SBASE[0] + SDX): loc = "SLICE_X%uY%u" % (lutx, luty) for belc in 'ABCD': bel = '%c6LUT' % belc - print('''\ + print( + '''\ (* KEEP, DONT_TOUCH, LOC="%s", BEL="%s" *) LUT6 #( @@ -66,12 +66,13 @@ for lutx in xrange(SBASE[0], SBASE[0] + SDX): print('''\ .I%u(%s),''' % (i, wfrom)) print('''\ - .O(outs[%u]));''') % (outi,) + .O(outs[%u]));''') % (outi, ) outi += 1 #assert nin == ini assert nout == outi -print(''' +print( + ''' endmodule module top(input wire clk, input wire stb, input wire di, output wire do); @@ -100,4 +101,3 @@ module top(input wire clk, input wire stb, input wire di, output wire do); .outs(dout) ); endmodule''') % (nin, nout) - diff --git a/fuzzers/007-timing/projects/placelut_ff_fb/generate.py b/fuzzers/007-timing/projects/placelut_ff_fb/generate.py index 3f8b2784..410e995f 100644 --- a/fuzzers/007-timing/projects/placelut_ff_fb/generate.py +++ b/fuzzers/007-timing/projects/placelut_ff_fb/generate.py @@ -1,5 +1,4 @@ #!/usr/bin/env python - ''' Note: vivado will (by default) fail bitgen DRC on LUT feedback loops Looks like can probably be disabled, but we actually don't need a bitstream for timing analysis @@ -18,7 +17,6 @@ parser = argparse.ArgumentParser(description='') parser.add_argument('--sdx', default='8', help='') parser.add_argument('--sdy', default='4', help='') args = parser.parse_args() - ''' Generate in pairs Fill up switchbox quad for now @@ -38,15 +36,16 @@ nin = 6 * nlut nout = nlut 
print('//placelut w/ FF + feedback') -print('//SBASE: %s' % (SBASE,)) -print('//SDX: %s' % (SDX,)) -print('//SDY: %s' % (SDX,)) -print('//nlut: %s' % (nlut,)) -print('''\ +print('//SBASE: %s' % (SBASE, )) +print('//SDX: %s' % (SDX, )) +print('//SDY: %s' % (SDX, )) +print('//nlut: %s' % (nlut, )) +print( + '''\ module roi ( input wire clk, input wire [%u:0] ins, - output wire [%u:0] outs);''') % (nin - 1, nout -1) + output wire [%u:0] outs);''') % (nin - 1, nout - 1) ini = 0 outi = 0 @@ -56,7 +55,8 @@ for lutx in xrange(SBASE[0], SBASE[0] + SDX): for belc in 'ABCD': bel = '%c6LUT' % belc name = 'lut_x%uy%u_%c' % (lutx, luty, belc) - print('''\ + print( + '''\ (* KEEP, DONT_TOUCH, LOC="%s", BEL="%s" *) LUT6 #( @@ -75,14 +75,15 @@ for lutx in xrange(SBASE[0], SBASE[0] + SDX): .I%u(%s),''' % (i, wfrom)) out_w = name + '_o' print('''\ - .O(%s));''') % (out_w,) + .O(%s));''') % (out_w, ) outs_w = "outs[%u]" % outi if random.randint(0, 9) < 5: print(' assign %s = %s;' % (outs_w, out_w)) else: out_r = name + '_or' - print('''\ + print( + '''\ reg %s; assign %s = %s; always @(posedge clk) begin @@ -94,7 +95,8 @@ for lutx in xrange(SBASE[0], SBASE[0] + SDX): #assert nin == ini assert nout == outi -print(''' +print( + ''' endmodule module top(input wire clk, input wire stb, input wire di, output wire do); @@ -123,4 +125,3 @@ module top(input wire clk, input wire stb, input wire di, output wire do); .outs(dout) ); endmodule''') % (nin, nout) - diff --git a/fuzzers/007-timing/rref.py b/fuzzers/007-timing/rref.py index bad37401..97b4efa0 100644 --- a/fuzzers/007-timing/rref.py +++ b/fuzzers/007-timing/rref.py @@ -1,5 +1,4 @@ #!/usr/bin/env python3 - ''' Triaging tool to help understand where we need more timing coverage Finds correlated variables to help make better test cases @@ -14,6 +13,7 @@ import sympy from collections import OrderedDict from fractions import Fraction + def fracr(r): DELTA = 0.0001 @@ -24,12 +24,15 @@ def fracr(r): r[i] = xi return [Fraction(x) for x in r] + def fracm(m): return [fracr(r) for r in m] + def fracr_quick(r): return [Fraction(numerator=int(x), denominator=1) for x in r] + # the way I'm doing thing they should all be even integers # hmm this was only slightly faster def fracm_quick(m): @@ -37,6 +40,7 @@ def fracm_quick(m): print('fracm_quick type: %s' % t) return [fracr_quick(r) for r in m] + class State(object): def __init__(self, Ads, drop_names=[]): self.Ads = Ads @@ -57,9 +61,11 @@ class State(object): print("Stats") print(" Substitutions: %u" % len(self.subs)) if self.subs: - print(" Largest: %u" % max([len(x) for x in self.subs.values()])) + print( + " Largest: %u" % max([len(x) for x in self.subs.values()])) print(" Rows: %u" % len(self.Ads)) - print(" Cols (in): %u" % (len(self.base_names) + len(self.drop_names))) + print( + " Cols (in): %u" % (len(self.base_names) + len(self.drop_names))) print(" Cols (preprocessed): %u" % len(self.base_names)) print(" Drop names: %u" % len(self.drop_names)) print(" Cols (out): %u" % len(self.names)) @@ -70,10 +76,11 @@ class State(object): def load(fn_ins, simplify=False, corner=None): Ads, b = loadc_Ads_b(fn_ins, corner=corner, ico=True) if simplify: - print('Simplifying corner %s' % (corner,)) + print('Simplifying corner %s' % (corner, )) Ads, b = simplify_rows(Ads, b, remove_zd=False, corner=corner) return State(Ads) + def write_state(state, fout): j = { 'names': dict([(x, None) for x in state.names]), @@ -84,6 +91,7 @@ def write_state(state, fout): } json.dump(j, fout, sort_keys=True, indent=4, separators=(',', ': ')) + 
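The Fraction conversion above is what keeps the rref computation exact: with
floating point arithmetic a dependent row can leave tiny nonzero residue behind
and show up as a spurious pivot. A small sketch of the failure mode this avoids
(assumes sympy is installed; the 2x2 matrix is invented):

    from fractions import Fraction
    import sympy

    m = [[Fraction(1), Fraction(2)], [Fraction(2), Fraction(4)]]
    rref, pivots = sympy.Matrix(m).rref()
    assert pivots == (0,)  # the dependent second row cancels exactly to zero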
def Anp2matrix(Anp): ''' Original idea was to make into a square matrix @@ -99,6 +107,7 @@ def Anp2matrix(Anp): dst_rowi = (dst_rowi + 1) % ncols return A_ub2 + def row_np2ds(rownp, names): ret = {} assert len(rownp) == len(names), (len(rownp), len(names)) @@ -108,6 +117,7 @@ def row_np2ds(rownp, names): ret[name] = v return ret + def row_sym2dsf(rowsym, names): '''Convert a sympy row into a dictionary of keys to (numerator, denominator) tuples''' from sympy import fraction @@ -121,6 +131,7 @@ def row_sym2dsf(rowsym, names): ret[name] = (int(num), int(den)) return ret + def state_rref(state, verbose=False): print('Converting rows to integer keys') names, Anp = A_ds2np(state.Ads) @@ -195,6 +206,7 @@ def state_rref(state, verbose=False): return state + def run(fnout, fn_ins, simplify=False, corner=None, verbose=0): print('Loading data') @@ -205,24 +217,21 @@ def run(fnout, fn_ins, simplify=False, corner=None, verbose=0): with open(fnout, 'w') as fout: write_state(state, fout) + def main(): import argparse - parser = argparse.ArgumentParser( - description= - 'Timing fuzzer' - ) + parser = argparse.ArgumentParser(description='Timing fuzzer') parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--simplify', action='store_true', help='') parser.add_argument('--corner', default="slow_max", help='') - parser.add_argument('--speed-json', default='build_speed/speed.json', + parser.add_argument( + '--speed-json', + default='build_speed/speed.json', help='Provides speed index to name translation') parser.add_argument('--out', help='Output sub.json substitution result') - parser.add_argument( - 'fns_in', - nargs='+', - help='timing3.txt input files') + parser.add_argument('fns_in', nargs='+', help='timing3.txt input files') args = parser.parse_args() bench = Benchmark() @@ -231,10 +240,15 @@ def main(): fns_in = glob.glob('specimen_*/timing3.csv') try: - run(fnout=args.out, - fn_ins=args.fns_in, simplify=args.simplify, corner=args.corner, verbose=args.verbose) + run( + fnout=args.out, + fn_ins=args.fns_in, + simplify=args.simplify, + corner=args.corner, + verbose=args.verbose) finally: print('Exiting after %s' % bench) + if __name__ == '__main__': main() diff --git a/fuzzers/007-timing/solve_leastsq.py b/fuzzers/007-timing/solve_leastsq.py index 5bdd4fad..1a1b55e6 100644 --- a/fuzzers/007-timing/solve_leastsq.py +++ b/fuzzers/007-timing/solve_leastsq.py @@ -15,6 +15,7 @@ import timfuz_solve import scipy.optimize as optimize from scipy.optimize import least_squares + def mkestimate(Anp, b): ''' Ballpark upper bound estimate assuming variables contribute all of the delay in their respective row @@ -33,6 +34,7 @@ def mkestimate(Anp, b): x0[coli] = min(x0[coli], ub) return x0 + def save(outfn, xvals, names, corner): # ballpark minimum actual observed delay is around 7 (carry chain) # anything less than one is probably a solver artifact @@ -45,7 +47,7 @@ def save(outfn, xvals, names, corner): 'fast_min': math.floor, 'slow_max': math.ceil, 'slow_min': math.floor, - }[corner] + }[corner] print('Writing results') skips = 0 @@ -69,16 +71,18 @@ def save(outfn, xvals, names, corner): items = [str(row_ico), acorner2csv(roundf(xval), corneri)] items.append('%u %s' % (1, name)) fout.write(','.join(items) + '\n') - print('Wrote: skip %u => %u / %u valid delays' % (skips, keeps, len(names))) + print( + 'Wrote: skip %u => %u / %u valid delays' % (skips, keeps, len(names))) assert keeps, 'Failed to estimate delay' -def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, 
outfn=None): + +def run_corner( + Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=None): # Given timing scores for above delays (-ps) assert type(Anp[0]) is np.ndarray, type(Anp[0]) assert type(b) is np.ndarray, type(b) #check_feasible(Anp, b) - ''' Be mindful of signs Have something like @@ -97,7 +101,6 @@ def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=Non print('Input paths') print(' # timing scores: %d' % len(b)) print(' Rows: %d' % rows) - ''' You must have at least as many things to optimize as variables That is, the system must be plausibly constrained for it to attempt a solve @@ -110,10 +113,11 @@ def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=Non tlast = [None] iters = [0] printn = [0] + def progress_print(): iters[0] += 1 if tlast[0] is None: - tlast[0]= time.time() + tlast[0] = time.time() if time.time() - tlast[0] > 1.0: sys.stdout.write('I:%d ' % iters[0]) tlast[0] = time.time() @@ -143,23 +147,22 @@ def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=Non if outfn: save(outfn, res.x, names, corner) + def main(): import argparse parser = argparse.ArgumentParser( description= - 'Solve timing solution using least squares objective function' - ) + 'Solve timing solution using least squares objective function') parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--massage', action='store_true', help='') - parser.add_argument('--sub-json', help='Group substitutions to make fully ranked') - parser.add_argument('--corner', default="slow_max", help='') - parser.add_argument('--out', default=None, help='output timing delay .json') parser.add_argument( - 'fns_in', - nargs='+', - help='timing3.csv input files') + '--sub-json', help='Group substitutions to make fully ranked') + parser.add_argument('--corner', default="slow_max", help='') + parser.add_argument( + '--out', default=None, help='output timing delay .json') + parser.add_argument('fns_in', nargs='+', help='timing3.csv input files') args = parser.parse_args() # Store options in dict to ease passing through functions bench = Benchmark() @@ -169,10 +172,17 @@ def main(): sub_json = load_sub(args.sub_json) try: - timfuz_solve.run(run_corner=run_corner, sub_json=sub_json, - fns_in=args.fns_in, corner=args.corner, massage=args.massage, outfn=args.out, verbose=args.verbose) + timfuz_solve.run( + run_corner=run_corner, + sub_json=sub_json, + fns_in=args.fns_in, + corner=args.corner, + massage=args.massage, + outfn=args.out, + verbose=args.verbose) finally: print('Exiting after %s' % bench) + if __name__ == '__main__': main() diff --git a/fuzzers/007-timing/solve_linprog.py b/fuzzers/007-timing/solve_linprog.py index ee73a702..29e4d826 100644 --- a/fuzzers/007-timing/solve_linprog.py +++ b/fuzzers/007-timing/solve_linprog.py @@ -12,6 +12,7 @@ import os import time import timfuz_solve + def save(outfn, xvals, names, corner): # ballpark minimum actual observed delay is around 7 (carry chain) # anything less than one is probably a solver artifact @@ -23,7 +24,7 @@ def save(outfn, xvals, names, corner): 'fast_min': math.floor, 'slow_max': math.ceil, 'slow_min': math.floor, - }[corner] + }[corner] print('Writing results') zeros = 0 @@ -45,9 +46,13 @@ def save(outfn, xvals, names, corner): items.append('%u %s' % (1, name)) fout.write(','.join(items) + '\n') nonzeros = len(names) - zeros - print('Wrote: %u / %u constrained delays, %u zeros' % (nonzeros, len(names), zeros)) + print( + 'Wrote: %u / %u constrained 
delays, %u zeros' % + (nonzeros, len(names), zeros)) -def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=None): + +def run_corner( + Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=None): if len(Anp) == 0: print('WARNING: zero equations') if outfn: @@ -58,14 +63,13 @@ def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=Non 'slow_min': False, 'fast_max': True, 'fast_min': False, - }[corner] + }[corner] # Given timing scores for above delays (-ps) assert type(Anp[0]) is np.ndarray, type(Anp[0]) assert type(b) is np.ndarray, type(b) #check_feasible(Anp, b) - ''' Be mindful of signs t1, t2: total delay constants @@ -133,6 +137,7 @@ def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=Non tlast = [time.time()] iters = [0] printn = [0] + def callback(xk, **kwargs): iters[0] = kwargs['nit'] if time.time() - tlast[0] > 1.0: @@ -147,8 +152,18 @@ def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=Non # Now find smallest values for delay constants # Due to input bounds (ex: column limit), some delay elements may get eliminated entirely print('Running linprog w/ %d r, %d c (%d name)' % (rows, cols, len(names))) - res = linprog(c, A_ub=A_ub, b_ub=b_ub, bounds=bounds, callback=callback, - options={"disp": True, 'maxiter': maxiter, 'bland': True, 'tol': 1e-6,}) + res = linprog( + c, + A_ub=A_ub, + b_ub=b_ub, + bounds=bounds, + callback=callback, + options={ + "disp": True, + 'maxiter': maxiter, + 'bland': True, + 'tol': 1e-6, + }) nonzeros = 0 print('Ran %d iters' % iters[0]) if res.success: @@ -159,31 +174,31 @@ def run_corner(Anp, b, names, corner, verbose=False, opts={}, meta={}, outfn=Non if nonzero: nonzeros += 1 #if nonzero and (verbose >= 1 or xi > 30): - if nonzero and (verbose or ((nonzeros < 100 or nonzeros % 20 == 0) and nonzeros <= plim)): + if nonzero and (verbose or ( + (nonzeros < 100 or nonzeros % 20 == 0) and nonzeros <= plim)): print(' % 4u % -80s % 10.1f' % (xi, name, x)) print('Delay on %d / %d' % (nonzeros, len(res.x))) if outfn: save(outfn, res.x, names, corner) + def main(): import argparse parser = argparse.ArgumentParser( description= - 'Solve timing solution using linear programming inequalities' - ) + 'Solve timing solution using linear programming inequalities') parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--massage', action='store_true', help='') parser.add_argument('--sub-csv', help='') - parser.add_argument('--sub-json', help='Group substitutions to make fully ranked') - parser.add_argument('--corner', default=None, required=True, help='') - parser.add_argument('--out', default=None, help='output timing delay .json') parser.add_argument( - 'fns_in', - nargs='*', - help='timing3.csv input files') + '--sub-json', help='Group substitutions to make fully ranked') + parser.add_argument('--corner', default=None, required=True, help='') + parser.add_argument( + '--out', default=None, help='output timing delay .json') + parser.add_argument('fns_in', nargs='*', help='timing3.csv input files') args = parser.parse_args() # Store options in dict to ease passing through functions bench = Benchmark() @@ -197,10 +212,18 @@ def main(): sub_json = load_sub(args.sub_json) try: - timfuz_solve.run(run_corner=run_corner, sub_json=sub_json, sub_csv=args.sub_csv, + timfuz_solve.run( + run_corner=run_corner, + sub_json=sub_json, + sub_csv=args.sub_csv,
+ fns_in=fns_in, + corner=args.corner, + massage=args.massage, + outfn=args.out, + verbose=args.verbose) finally: print('Exiting after %s' % bench) + if __name__ == '__main__': main() diff --git a/fuzzers/007-timing/speed/speed_json.py b/fuzzers/007-timing/speed/speed_json.py index 07dfd20b..1f0a3910 100644 --- a/fuzzers/007-timing/speed/speed_json.py +++ b/fuzzers/007-timing/speed/speed_json.py @@ -1,5 +1,6 @@ import json + def load_speed(fin): speed_models = {} speed_types = {} @@ -9,9 +10,9 @@ def load_speed(fin): for kvs in l.split(): name, value = kvs.split(':') name = name.lower() - if name in ('class',): + if name in ('class', ): continue - if name in ('speed_index',): + if name in ('speed_index', ): value = int(value) if name == 'type': speed_types.setdefault(value, {}) @@ -38,6 +39,7 @@ def load_speed(fin): speed_models[delayk] = delay return speed_models, speed_types + def load_cost_code(fin): # COST_CODE:4 COST_CODE_NAME:SLOWSINGLE cost_codes = {} @@ -53,11 +55,12 @@ def load_cost_code(fin): 'code': int(lj['cost_code']), # Hmm is this unique per type? #'speed_class': int(lj['speed_class']), - } - + } + cost_codes[cost_code['name']] = cost_code return cost_codes + def run(speed_fin, node_fin, fout, verbose=0): print('Loading data') speed_models, speed_types = load_speed(speed_fin) @@ -67,32 +70,25 @@ def run(speed_fin, node_fin, fout, verbose=0): 'speed_model': speed_models, 'speed_type': speed_types, 'cost_code': cost_codes, - } + } json.dump(j, fout, sort_keys=True, indent=4, separators=(',', ': ')) + if __name__ == '__main__': import argparse - parser = argparse.ArgumentParser( - description= - 'Timing fuzzer' - ) + parser = argparse.ArgumentParser(description='Timing fuzzer') parser.add_argument('--verbose', type=int, help='') parser.add_argument( - 'speed_fn_in', - default='/dev/stdin', - nargs='?', - help='Input file') + 'speed_fn_in', default='/dev/stdin', nargs='?', help='Input file') parser.add_argument( - 'node_fn_in', - default='/dev/stdin', - nargs='?', - help='Input file') + 'node_fn_in', default='/dev/stdin', nargs='?', help='Input file') parser.add_argument( - 'fn_out', - default='/dev/stdout', - nargs='?', - help='Output file') + 'fn_out', default='/dev/stdout', nargs='?', help='Output file') args = parser.parse_args() - run(open(args.speed_fn_in, 'r'), open(args.node_fn_in, 'r'), open(args.fn_out, 'w'), verbose=args.verbose) + run( + open(args.speed_fn_in, 'r'), + open(args.node_fn_in, 'r'), + open(args.fn_out, 'w'), + verbose=args.verbose) diff --git a/fuzzers/007-timing/sub2csv.py b/fuzzers/007-timing/sub2csv.py index 9ea9bbbc..8567d5e3 100644 --- a/fuzzers/007-timing/sub2csv.py +++ b/fuzzers/007-timing/sub2csv.py @@ -9,6 +9,7 @@ import sympy from collections import OrderedDict from fractions import Fraction + def mlcm(xs): ''' Find the LCM between elements in a group @@ -20,6 +21,7 @@ def mlcm(xs): l = int(max(lthis, l)) return ret + def write_state(state, fout): j = { 'names': dict([(x, None) for x in state.names]), @@ -30,6 +32,7 @@ def write_state(state, fout): } json.dump(j, fout, sort_keys=True, indent=4, separators=(',', ': ')) + def gen_rows(fn_ins): for fn_in in fn_ins: try: @@ -52,7 +55,7 @@ def gen_rows(fn_ins): n = 1 for _var, (_num, den) in sub.items(): n *= den - + for var, (num, den) in sub.items(): num2 = n * num assert num2 % den == 0 @@ -62,6 +65,7 @@ def gen_rows(fn_ins): print("Error processing %s" % fn_in) raise + def run(fnout, fn_ins, verbose=0): print('Loading data') @@ -76,6 +80,7 @@ def run(fnout, fn_ins, verbose=0): items.append('%i 
%s' % (v, k)) fout.write(','.join(items) + '\n') + def main(): import argparse @@ -86,20 +91,17 @@ def main(): parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--out', help='Output csv') - parser.add_argument( - 'fns_in', - nargs='*', - help='sub.json input files') + parser.add_argument('fns_in', nargs='*', help='sub.json input files') args = parser.parse_args() bench = Benchmark() fns_in = args.fns_in try: - run(fnout=args.out, - fn_ins=args.fns_in, verbose=args.verbose) + run(fnout=args.out, fn_ins=args.fns_in, verbose=args.verbose) finally: print('Exiting after %s' % bench) + if __name__ == '__main__': main() diff --git a/fuzzers/007-timing/tile_annotate.py b/fuzzers/007-timing/tile_annotate.py index 5b897b4d..58b89235 100644 --- a/fuzzers/007-timing/tile_annotate.py +++ b/fuzzers/007-timing/tile_annotate.py @@ -8,10 +8,12 @@ import os import time import json + # corner workaround def quad(x): return [x for _ in range(4)] + def run(fnin, fnout, tile_json_fn, verbose=False): # modified in place tilej = json.load(open(tile_json_fn, 'r')) @@ -50,18 +52,26 @@ def run(fnin, fnout, tile_json_fn, verbose=False): for corner, corneri in timfuz.corner_s2i.items(): print('Corner %s' % corner) - print(' Pips: %u / %u solved, %u / %u covered' % (pipn_solved[corneri], pipn_net, pipn_covered[corneri], pipn_net)) - print(' Wires: %u / %u solved, %u / %u covered' % (wiren_solved[corneri], wiren_net, wiren_covered[corneri], wiren_net)) + print( + ' Pips: %u / %u solved, %u / %u covered' % + (pipn_solved[corneri], pipn_net, pipn_covered[corneri], pipn_net)) + print( + ' Wires: %u / %u solved, %u / %u covered' % ( + wiren_solved[corneri], wiren_net, wiren_covered[corneri], + wiren_net)) + + json.dump( + tilej, + open(fnout, 'w'), + sort_keys=True, + indent=4, + separators=(',', ': ')) - json.dump(tilej, open(fnout, 'w'), sort_keys=True, indent=4, separators=(',', ': ')) def main(): import argparse - parser = argparse.ArgumentParser( - description= - '' - ) + parser = argparse.ArgumentParser(description='') parser.add_argument('--tile-json', default='tiles.json', help='') parser.add_argument('fnin', default=None, help='Flattened timing csv') parser.add_argument('fnout', default=None, help='output tile .json') @@ -69,5 +79,6 @@ def main(): run(args.fnin, args.fnout, args.tile_json, verbose=False) + if __name__ == '__main__': main() diff --git a/fuzzers/007-timing/tile_combine.py b/fuzzers/007-timing/tile_combine.py index 35ea2291..940d628f 100644 --- a/fuzzers/007-timing/tile_combine.py +++ b/fuzzers/007-timing/tile_combine.py @@ -6,11 +6,12 @@ import time import json from collections import OrderedDict -corner_s2i = OrderedDict([ - ('fast_max', 0), - ('fast_min', 1), - ('slow_max', 2), - ('slow_min', 3), +corner_s2i = OrderedDict( + [ + ('fast_max', 0), + ('fast_min', 1), + ('slow_max', 2), + ('slow_min', 3), ]) corner2minmax = { @@ -18,7 +19,8 @@ corner2minmax = { 'fast_min': min, 'slow_max': max, 'slow_min': min, - } +} + def build_tilejo(fnins): ''' @@ -45,6 +47,7 @@ def build_tilejo(fnins): tilejo['tiles'][tilek] = tilevi # Otherwise combine else: + def process_type(etype): for pipk, pipvi in tilevi[etype].items(): pipvo = tilevo[etype][pipk] @@ -61,10 +64,12 @@ def build_tilejo(fnins): else: minmax = corner2minmax[cornerk] pipvo[corneri] = minmax(cornervi, cornervo) + process_type('pips') process_type('wires') return tilejo + def check_corner_minmax(tilej, verbose=False): # Post processing pass looking for min/max inconsistencies # Especially an issue due to
complexities around under-constrained elements @@ -73,12 +78,13 @@ def check_corner_minmax(tilej, verbose=False): checks = 0 bad = 0 for tilev in tilej['tiles'].values(): + def process_type(etype): nonlocal checks nonlocal bad for pipk, pipv in tilev[etype].items(): - for corner in ('slow', 'fast'): + for corner in ('slow', 'fast'): mini = corner_s2i[corner + '_min'] minv = pipv[mini] maxi = corner_s2i[corner + '_max'] @@ -87,7 +93,9 @@ def check_corner_minmax(tilej, verbose=False): checks += 1 if minv > maxv: if verbose: - print('WARNING: element %s %s min/max adjusted on corner %s' % (etype, pipk, corner)) + print( + 'WARNING: element %s %s min/max adjusted on corner %s' + % (etype, pipk, corner)) bad += 1 pipv[mini] = maxv pipv[maxi] = minv @@ -96,28 +104,35 @@ def check_corner_minmax(tilej, verbose=False): process_type('wires') print('minmax: %u / %u bad' % (bad, checks)) + def check_corners_minmax(tilej, verbose=False): # TODO: check fast vs slow pass + def run(fnins, fnout, verbose=False): tilejo = build_tilejo(fnins) check_corner_minmax(tilejo) check_corners_minmax(tilejo) - json.dump(tilejo, open(fnout, 'w'), sort_keys=True, indent=4, separators=(',', ': ')) + json.dump( + tilejo, + open(fnout, 'w'), + sort_keys=True, + indent=4, + separators=(',', ': ')) + def main(): import argparse parser = argparse.ArgumentParser( - description= - 'Combine multiple tile corners into one .json file' - ) + description='Combine multiple tile corners into one .json file') parser.add_argument('--out', required=True, help='Combined .json file') parser.add_argument('fnins', nargs='+', help='Input .json files') args = parser.parse_args() run(args.fnins, args.out, verbose=False) + if __name__ == '__main__': main() diff --git a/fuzzers/007-timing/timfuz.py b/fuzzers/007-timing/timfuz.py index 6287cce2..45569ed2 100644 --- a/fuzzers/007-timing/timfuz.py +++ b/fuzzers/007-timing/timfuz.py @@ -16,27 +16,30 @@ from fractions import Fraction from benchmark import Benchmark -NAME_ZERO = set([ - "BSW_CLK_ZERO", - "BSW_ZERO", - "B_ZERO", - "C_CLK_ZERO", - "C_DSP_ZERO", - "C_ZERO", - "I_ZERO", - "O_ZERO", - "RC_ZERO", - "R_ZERO", - ]) +NAME_ZERO = set( + [ + "BSW_CLK_ZERO", + "BSW_ZERO", + "B_ZERO", + "C_CLK_ZERO", + "C_DSP_ZERO", + "C_ZERO", + "I_ZERO", + "O_ZERO", + "RC_ZERO", + "R_ZERO", + ]) # csv index -corner_s2i = OrderedDict([ - ('fast_max', 0), - ('fast_min', 1), - ('slow_max', 2), - ('slow_min', 3), +corner_s2i = OrderedDict( + [ + ('fast_max', 0), + ('fast_min', 1), + ('slow_max', 2), + ('slow_min', 3), ]) + # Equations are filtered out until nothing is left class SimplifiedToZero(Exception): pass @@ -45,6 +48,7 @@ class SimplifiedToZero(Exception): def allow_zero_eqns(): return os.getenv('ALLOW_ZERO_EQN', 'N') == 'Y' + def print_eqns(A_ubd, b_ub, verbose=0, lim=3, label=''): rows = len(b_ub) @@ -52,7 +56,8 @@ def print_eqns(A_ubd, b_ub, verbose=0, lim=3, label=''): prints = 0 #verbose = 1 for rowi, row in enumerate(A_ubd): - if verbose or ((rowi < 10 or rowi % max(1, (rows / 20)) == 0) and (not lim or prints < lim)): + if verbose or ((rowi < 10 or rowi % max(1, (rows / 20)) == 0) and + (not lim or prints < lim)): line = ' EQN: p%u: ' % rowi for k, v in sorted(row.items()): line += '%u*t%d ' % (v, k) @@ -60,6 +65,7 @@ def print_eqns(A_ubd, b_ub, verbose=0, lim=3, label=''): print(line) prints += 1 + def print_name_eqns(A_ubd, b_ub, names, verbose=0, lim=3, label=''): rows = len(b_ub) @@ -67,7 +73,8 @@ def print_name_eqns(A_ubd, b_ub, names, verbose=0, lim=3, label=''): prints = 0 #verbose = 1 for rowi, 
row in enumerate(A_ubd): - if verbose or ((rowi < 10 or rowi % max(1, (rows / 20)) == 0) and (not lim or prints < lim)): + if verbose or ((rowi < 10 or rowi % max(1, (rows / 20)) == 0) and + (not lim or prints < lim)): line = ' EQN: p%u: ' % rowi for k, v in sorted(row.items()): line += '%u*%s ' % (v, names[k]) @@ -75,19 +82,23 @@ print(line) prints += 1 + def print_names(names, verbose=1): print('Names: %d' % len(names)) for xi, name in enumerate(names): print(' % 4u % -80s' % (xi, name)) + def invb(b_ub): #return [-b for b in b_ub] return -np.array(b_ub) + def check_feasible_d(A_ubd, b_ub, names): A_ub, b_ub_inv = Ab_d2np(A_ubd, b_ub, names) check_feasible(A_ub, b_ub_inv) + def check_feasible(A_ub, b_ub): sys.stdout.write('Check feasible ') sys.stdout.flush() @@ -118,6 +129,7 @@ def check_feasible(A_ub, b_ub): this += A_ub[row][col] * xs[col] ret[row] = this return ret + b_res = my_mul(A_ub, xs) # Verify bound was respected @@ -126,10 +138,13 @@ def check_feasible(A_ub, b_ub): sys.stdout.write('.') sys.stdout.flush() if this_b >= this_b_ub or this_b > 0: - print('% 4d Want res % 10.1f <= % 10.1f <= 0' % (rowi, this_b, this_b_ub)) + print( + '% 4d Want res % 10.1f <= % 10.1f <= 0' % + (rowi, this_b, this_b_ub)) raise Exception("Bad ") print(' done') + def Ab_ub_dt2d(eqns): '''Convert dict using the rows as keys into a list of dicts + b_ub list (ie return A_ub, b_ub)''' #return [dict(rowt) for rowt in eqns] @@ -137,6 +152,7 @@ def Ab_ub_dt2d(eqns): A_ubd, b_ub = zip(*rows) return list(A_ubd), list(b_ub) + # This significantly reduces runtime def simplify_rows(Ads, b_ub, remove_zd=False, corner=None): '''Remove duplicate equations, taking highest delay''' @@ -150,14 +166,14 @@ def simplify_rows(Ads, b_ub, remove_zd=False, corner=None): 'fast_min': min, 'slow_max': max, 'slow_min': min, - }[corner] + }[corner] # An outlier to make unknown values be ignored T_UNK = { 'fast_max': 0, 'fast_min': 10e9, 'slow_max': 0, 'slow_min': 10e9, - }[corner] + }[corner] sys.stdout.write('SimpR ') sys.stdout.flush() @@ -188,12 +204,15 @@ def simplify_rows(Ads, b_ub, remove_zd=False, corner=None): print(' done') - print('Simplify rows: %d => %d rows w/ zd %d, ze %d' % (len(b_ub), len(eqns), zero_ds, zero_es)) + print( + 'Simplify rows: %d => %d rows w/ zd %d, ze %d' % + (len(b_ub), len(eqns), zero_ds, zero_es)) if len(eqns) == 0: raise SimplifiedToZero() A_ubd_ret, b_ub_ret = Ab_ub_dt2d(eqns) return A_ubd_ret, b_ub_ret + def A_ubr_np2d(row): '''Convert a single row''' #d = {} @@ -203,6 +222,7 @@ def A_ubr_np2d(row): d[coli] = val return d + def A_ub_np2d(A_ub): '''Convert A_ub entries in numpy matrix to dictionary / sparse form''' Adi = [None] * len(A_ub) @@ -210,6 +230,7 @@ def A_ub_np2d(A_ub): Adi[i] = A_ubr_np2d(row) return Adi + def Ar_di2np(row_di, cols): rownp = np.zeros(cols) for coli, val in row_di.items(): @@ -217,37 +238,45 @@ def Ar_di2np(row_di, cols): rownp[coli] = val return rownp + # NOTE: sign inversion def A_di2np(Adi, cols): '''Convert A_ub entries in dictionary / sparse to numpy matrix form''' return [Ar_di2np(row_di, cols) for row_di in Adi] + def Ar_ds2t(rowd): '''Convert a dictionary row into a tuple with (column number, value) tuples''' return tuple(sorted(rowd.items())) + def A_ubr_t2d(rowt): '''Convert a tuple row with (column number, value) tuples into a dictionary''' return OrderedDict(rowt) + def A_ub_d2t(A_ubd): '''Convert rows as dicts to rows as tuples''' return [Ar_ds2t(rowd) for rowd in A_ubd] + def
A_ub_t2d(A_ubd): '''Convert rows as tuples to rows as dicts''' return [OrderedDict(rowt) for rowt in A_ubd] + def Ab_d2np(A_ubd, b_ub, names): A_ub = A_di2np(A_ubd, len(names)) b_ub_inv = invb(b_ub) return A_ub, b_ub_inv + def Ab_np2d(A_ub, b_ub_inv): A_ubd = A_ub_np2d(A_ub) b_ub = invb(b_ub_inv) return A_ubd, b_ub + def sort_equations(Ads, b): # Track rows with value column # Hmm can't sort against np arrays @@ -257,6 +286,7 @@ def sort_equations(Ads, b): A_ubtr, b_ubr = zip(*res) return [OrderedDict(rowt) for rowt in A_ubtr], b_ubr + def derive_eq_by_row(A_ubd, b_ub, verbose=0, col_lim=0, tweak=False): ''' Derive equations by subtracting whole rows @@ -348,10 +378,13 @@ def derive_eq_by_row(A_ubd, b_ub, verbose=0, col_lim=0, tweak=False): print(' done') #A_ub_ret = A_di2np(A_ubd2, cols=cols) - print('Derive row: %d => %d rows using %d lte, %d sc' % (len(b_ub), len(b_ub_ret), ltes, scs)) + print( + 'Derive row: %d => %d rows using %d lte, %d sc' % + (len(b_ub), len(b_ub_ret), ltes, scs)) assert len(A_ubd_ret) == len(b_ub_ret) return A_ubd_ret, b_ub_ret + def derive_eq_by_col(A_ubd, b_ub, verbose=0): ''' Derive equations by subtracting out all bounded constants (ie "known" columns) @@ -380,7 +413,6 @@ def derive_eq_by_col(A_ubd, b_ub, verbose=0): print(' done') #knowns_set = set(knowns.keys()) print('%d constrained' % len(knowns)) - ''' Now see what we can do Rows that are already constrained: eliminate @@ -425,6 +457,7 @@ def derive_eq_by_col(A_ubd, b_ub, verbose=0): print('Derive col: %d => %d rows' % (len(b_ub), len(b_ub_ret))) return A_ubd_ret, b_ub_ret + def col_dist(Ads, desc='of', names=[], lim=0): '''print(frequency distribution of number of elements in a given row''' rows = len(Ads) @@ -435,7 +468,9 @@ def col_dist(Ads, desc='of', names=[], lim=0): this_cols = len(row) fs[this_cols] = fs.get(this_cols, 0) + 1 - print('Col count distribution (%s) for %dr x %dc w/ %d freqs' % (desc, rows, cols, len(fs))) + print( + 'Col count distribution (%s) for %dr x %dc w/ %d freqs' % + (desc, rows, cols, len(fs))) prints = 0 for i, (k, v) in enumerate(sorted(fs.items())): if lim == 0 or (lim and prints < lim or i == len(fs) - 1): @@ -444,6 +479,7 @@ def col_dist(Ads, desc='of', names=[], lim=0): if lim and prints == lim: print(' ...') + def name_dist(A_ubd, desc='of', names=[], lim=0): '''print(frequency distribution of number of times an element appears''' rows = len(A_ubd) @@ -467,7 +503,7 @@ def name_dist(A_ubd, desc='of', names=[], lim=0): for v in fs.values(): fs2[v] = fs2.get(v, 0) + 1 prints = 0 - print('Distribution distribution (%d items)'% len(fs2)) + print('Distribution distribution (%d items)' % len(fs2)) for i, (k, v) in enumerate(sorted(fs2.items())): if lim == 0 or (lim and prints < lim or i == len(fs2) - 1): print(' %s: %s' % (k, v)) @@ -479,6 +515,7 @@ def name_dist(A_ubd, desc='of', names=[], lim=0): if zeros: raise Exception("%d names without equation" % zeros) + def filter_ncols(A_ubd, b_ub, cols_min=0, cols_max=0): '''Only keep equations with a few delay elements''' A_ubd_ret = [] @@ -486,26 +523,32 @@ def filter_ncols(A_ubd, b_ub, cols_min=0, cols_max=0): #print('Removing large rows') for rowd, b in zip(A_ubd, b_ub): - if (not cols_min or len(rowd) >= cols_min) and (not cols_max or len(rowd) <= cols_max): + if (not cols_min or len(rowd) >= cols_min) and (not cols_max or + len(rowd) <= cols_max): A_ubd_ret.append(rowd) b_ub_ret.append(b) - print('Filter ncols w/ %d <= cols <= %d: %d ==> %d rows' % (cols_min, cols_max, len(b_ub), len(b_ub_ret))) + print( + 'Filter ncols w/ 
%d <= cols <= %d: %d ==> %d rows' % + (cols_min, cols_max, len(b_ub), len(b_ub_ret))) assert len(b_ub_ret) return A_ubd_ret, b_ub_ret + def Ar_di2ds(rowA, names): row = OrderedDict() for k, v in rowA.items(): row[names[k]] = v return row + def A_di2ds(Adi, names): rows = [] for row_di in Adi: rows.append(Ar_di2ds(row_di, names)) return rows + def Ar_ds2di(row_ds, names): def keyi(name): if name not in names: @@ -517,6 +560,7 @@ def Ar_ds2di(row_ds, names): row_di[keyi(k)] = v return row_di + def A_ds2di(rows): names = OrderedDict() @@ -526,10 +570,12 @@ def A_ds2di(rows): return list(names.keys()), A_ubd + def A_ds2np(Ads): names, Adi = A_ds2di(Ads) return names, A_di2np(Adi, len(names)) + def loadc_Ads_mkb(fns, mkb, filt): bs = [] Ads = [] @@ -548,10 +594,13 @@ def loadc_Ads_mkb(fns, mkb, filt): return None else: return int(bstr) + corners = [mkcorner(corner) for corner in corners.split()] + def mkvar(x): i, var = x.split() return (var, int(i)) + vars = OrderedDict([mkvar(var) for var in vars]) if not filt(ico, corners, vars): continue @@ -561,6 +610,7 @@ def loadc_Ads_mkb(fns, mkb, filt): return Ads, bs + def loadc_Ads_b(fns, corner, ico=None): corner = corner or "slow_max" corneri = corner_s2i[corner] @@ -572,8 +622,10 @@ def loadc_Ads_b(fns, corner, ico=None): def mkb(val): return val[corneri] + return loadc_Ads_mkb(fns, mkb, filt) + def loadc_Ads_bs(fns, ico=None): if ico is not None: filt = lambda ico_, corners, vars: ico_ == ico @@ -582,15 +634,19 @@ def loadc_Ads_bs(fns, ico=None): def mkb(val): return val + return loadc_Ads_mkb(fns, mkb, filt) + def loadc_Ads_raw(fns): filt = lambda ico, corners, vars: True def mkb(val): return val + return loadc_Ads_mkb(fns, mkb, filt) + def index_names(Ads): names = set() for row_ds in Ads: @@ -598,6 +654,7 @@ def index_names(Ads): names.add(k1) return names + def load_sub(fn): j = json.load(open(fn, 'r')) @@ -607,6 +664,7 @@ def load_sub(fn): return j + def row_sub_syms(row, sub_json, strict=False, verbose=False): if 0 and verbose: print("") @@ -669,6 +727,7 @@ def row_sub_syms(row, sub_json, strict=False, verbose=False): for k, v in sorted(row.items()): assert v > 0, (k, v) + def run_sub_json(Ads, sub_json, strict=False, verbose=False): ''' strict: complain if a sub doesn't go in evenly @@ -709,13 +768,15 @@ def run_sub_json(Ads, sub_json, strict=False, verbose=False): print("Sub: %u / %u rows changed" % (nsubs, nrows)) print("Sub: %u => %u non-zero row cols" % (ncols_old, ncols_new)) + def print_eqns(Ads, b, verbose=0, lim=3, label=''): rows = len(b) print('Sample equations (%s) from %d r' % (label, rows)) prints = 0 for rowi, row in enumerate(Ads): - if verbose or ((rowi < 10 or rowi % max(1, (rows / 20)) == 0) and (not lim or prints < lim)): + if verbose or ((rowi < 10 or rowi % max(1, (rows / 20)) == 0) and + (not lim or prints < lim)): line = ' EQN: p%u: ' % rowi for k, v in sorted(row.items()): line += '%u*t%s ' % (v, k) @@ -723,10 +784,12 @@ def print_eqns(Ads, b, verbose=0, lim=3, label=''): print(line) prints += 1 + def print_eqns_np(A_ub, b_ub, verbose=0): Adi = A_ub_np2d(A_ub) print_eqns(Adi, b_ub, verbose=verbose) + def Ads2bounds(Ads, bs): ret = {} for row_ds, row_bs in zip(Ads, bs): @@ -736,17 +799,20 @@ def Ads2bounds(Ads, bs): ret[k] = row_bs return ret + def instances(Ads): ret = 0 for row_ds in Ads: ret += sum(row_ds.values()) return ret + def acorner2csv(b, corneri): corners = ["None" for _ in range(4)] corners[corneri] = str(b) return ' '.join(corners) + def corners2csv(bs): assert len(bs) == 4 corners = ["None" if b is 
None else str(b) for b in bs] diff --git a/fuzzers/007-timing/timfuz_massage.py b/fuzzers/007-timing/timfuz_massage.py index 1f52af5b..4be04737 100644 --- a/fuzzers/007-timing/timfuz_massage.py +++ b/fuzzers/007-timing/timfuz_massage.py @@ -10,6 +10,7 @@ import time import copy from collections import OrderedDict + def lte_const(row_ref, row_cmp): '''Return true if all constants are smaller magnitude in row_cmp than row_ref''' #return False @@ -22,6 +23,7 @@ def lte_const(row_ref, row_cmp): return False return True + def shared_const(row_ref, row_cmp): '''Return true if more constants are equal than not equal''' #return False @@ -43,6 +45,7 @@ def shared_const(row_ref, row_cmp): # Will equation reduce if subtracted? return matches > unmatches + def reduce_const(row_ref, row_cmp): '''Subtract cmp constants from ref''' #ret = {} @@ -57,6 +60,7 @@ def reduce_const(row_ref, row_cmp): ret[k] = res return ret + def derive_eq_by_row(Ads, b, verbose=0, col_lim=0, tweak=False): ''' Derive equations by subtracting whole rows @@ -148,10 +152,13 @@ def derive_eq_by_row(Ads, b, verbose=0, col_lim=0, tweak=False): print(' done') #A_ub_ret = A_di2np(Ads2, cols=cols) - print('Derive row: %d => %d rows using %d lte, %d sc' % (len(b), len(b_ret), ltes, scs)) + print( + 'Derive row: %d => %d rows using %d lte, %d sc' % + (len(b), len(b_ret), ltes, scs)) assert len(Ads_ret) == len(b_ret) return Ads_ret, b_ret + def derive_eq_by_near_row(Ads, b, verbose=0, col_lim=0, tweak=False): ''' Derive equations by subtracting whole rows @@ -199,7 +206,8 @@ def derive_eq_by_near_row(Ads, b, verbose=0, col_lim=0, tweak=False): continue #for row_cmpi, row_cmp in enumerate(Ads): - for row_cmpi in range(max(0, row_refi - rowdelta), min(len(Ads), row_refi + rowdelta)): + for row_cmpi in range(max(0, row_refi - rowdelta), + min(len(Ads), row_refi + rowdelta)): if row_refi == row_cmpi or col_lim and len(row_cmp) > col_lim: continue row_cmp = Ads[row_cmpi] @@ -246,10 +254,13 @@ def derive_eq_by_near_row(Ads, b, verbose=0, col_lim=0, tweak=False): print(' done') #A_ub_ret = A_di2np(Ads2, cols=cols) - print('Derive row: %d => %d rows using %d lte, %d sc' % (len(b), len(b_ret), ltes, scs)) + print( + 'Derive row: %d => %d rows using %d lte, %d sc' % + (len(b), len(b_ret), ltes, scs)) assert len(Ads_ret) == len(b_ret) return Ads_ret, b_ret + def derive_eq_by_col(Ads, b_ub, verbose=0): ''' Derive equations by subtracting out all bounded constants (ie "known" columns) @@ -277,7 +288,6 @@ def derive_eq_by_col(Ads, b_ub, verbose=0): print(' done') #knowns_set = set(knowns.keys()) print('%d constrained' % len(knowns)) - ''' Now see what we can do Rows that are already constrained: eliminate @@ -322,6 +332,7 @@ def derive_eq_by_col(Ads, b_ub, verbose=0): print('Derive col: %d => %d rows' % (len(b_ub), len(b_ret))) return Ads_ret, b_ret + # keep deriving until solution is (probably) stable def massage_equations_old(Ads, b, verbose=False, derive_lim=3, corner=None): ''' @@ -357,7 +368,9 @@ def massage_equations_old(Ads, b, verbose=False, derive_lim=3, corner=None): debug("der_rows") # Run another simplify pass since new equations may have overlap with original Ads, b = simplify_rows(Ads, b, corner=corner) - print('Derive row %d / %d: %d => %d equations' % (di + 1, derive_lim, n_orig, len(b))) + print( + 'Derive row %d / %d: %d => %d equations' % + (di + 1, derive_lim, n_orig, len(b))) debug("der_rows simp") n_orig2 = len(b) @@ -366,19 +379,19 @@ def massage_equations_old(Ads, b, verbose=False, derive_lim=3, corner=None): debug("der_cols")
# Run another simplify pass since new equations may have overlap with original Ads, b = simplify_rows(Ads, b, corner=corner) - print('Derive col %d / %d: %d => %d equations' % (di + 1, derive_lim, n_orig2, len(b))) + print( + 'Derive col %d / %d: %d => %d equations' % + (di + 1, derive_lim, n_orig2, len(b))) debug("der_cols simp") if n_orig == len(b): break - dend = len(b) print('') print('Derive net: %d => %d' % (dstart, dend)) print('') # Was experimenting to see how much the higher order columns really help - ''' cols_min_post = opts.get('cols_min_post', None) cols_max_post = opts.get('cols_max_post', None) @@ -393,6 +406,7 @@ def massage_equations_old(Ads, b, verbose=False, derive_lim=3, corner=None): debug("final (sorted)") return Ads, b + # iteratively increasing column limit until all columns are added def massage_equations_inc_col_lim(Ads, b, verbose=False, corner=None): ''' @@ -467,6 +481,7 @@ def massage_equations_inc_col_lim(Ads, b, verbose=False, corner=None): print('Massage final: %d => %d rows' % (dstart, dend)) return Ads, b + # only derive based on nearby equations # theory is they will be the best to diff def massage_equations_near(Ads, b, verbose=False, corner=None): @@ -532,4 +547,5 @@ def massage_equations_near(Ads, b, verbose=False, corner=None): print('Massage final: %d => %d rows' % (dstart, dend)) return Ads, b + massage_equations = massage_equations_inc_col_lim
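To make the row-derivation helpers above concrete, here is a minimal sketch using the dict-based row form they operate on (the element names and delays are invented, and it assumes the caller subtracts the b constants in step with reduce_const):

row_ref = {'PIP_A': 1, 'WIRE_B': 2, 'WIRE_C': 1}  # b_ref = 120
row_cmp = {'PIP_A': 1, 'WIRE_B': 2}               # b_cmp = 90
# every coefficient in row_cmp is <= its counterpart in row_ref, so
# lte_const(row_ref, row_cmp) holds and the subtraction cannot go negative:
# reduce_const(row_ref, row_cmp) -> {'WIRE_C': 1} with b = 120 - 90 = 30,
# a much tighter constraint on WIRE_C than the original three-term row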
diff --git a/fuzzers/007-timing/timfuz_solve.py b/fuzzers/007-timing/timfuz_solve.py index 52a4c43e..4f6446ef 100644 --- a/fuzzers/007-timing/timfuz_solve.py +++ b/fuzzers/007-timing/timfuz_solve.py @@ -15,6 +15,7 @@ import datetime import os import time + def check_feasible(A_ub, b_ub): ''' Put large timing constants into the equations @@ -31,7 +32,6 @@ def check_feasible(A_ub, b_ub): cols = len(A_ub[0]) progress = max(1, rows / 100) - ''' Delays should be in order of ns, so a 10 ns delay should be way above what anything should be Series can have several hundred delay elements @@ -56,6 +56,7 @@ def check_feasible(A_ub, b_ub): this += A_ub[row][col] * xs[col] ret[row] = this return ret + b_res = my_mul(A_ub, xs) # Verify bound was respected @@ -64,10 +65,13 @@ def check_feasible(A_ub, b_ub): sys.stdout.write('.') sys.stdout.flush() if this_b >= this_b_ub or this_b > 0: - print('% 4d Want res % 10.1f <= % 10.1f <= 0' % (rowi, this_b, this_b_ub)) + print( + '% 4d Want res % 10.1f <= % 10.1f <= 0' % + (rowi, this_b, this_b_ub)) raise Exception("Bad ") print(' done') + def filter_bounds(Ads, b, bounds, corner): '''Given min variable delays, remove rows that won't constrain solution''' #assert len(bounds) > 0 @@ -76,11 +80,13 @@ def filter_bounds(Ads, b, bounds, corner): # Keep delays possibly larger than current bound def keep(row_b, est): return row_b > est + T_UNK = 0 elif 'min' in corner: # Keep delays possibly smaller than current bound def keep(row_b, est): return row_b < est + T_UNK = 1e9 else: assert 0 @@ -96,7 +102,18 @@ def filter_bounds(Ads, b, bounds, corner): ret_b.append(row_b) return ret_Ads, ret_b -def run(fns_in, corner, run_corner, sub_json=None, sub_csv=None, dedup=True, massage=False, outfn=None, verbose=False, **kwargs): + +def run( + fns_in, + corner, + run_corner, + sub_json=None, + sub_csv=None, + dedup=True, + massage=False, + outfn=None, + verbose=False, + **kwargs): print('Loading data') Ads, b = loadc_Ads_b(fns_in, corner, ico=True) @@ -120,7 +137,6 @@ def run(fns_in, corner, run_corner, sub_json=None, sub_csv=None, dedup=True, mas print('Sub: %u => %u instances' % (iold,
instances(Ads))) else: names = index_names(Ads) - ''' Substitution .csv Special .csv containing one variable per line @@ -132,7 +148,9 @@ def run(fns_in, corner, run_corner, sub_json=None, sub_csv=None, dedup=True, mas assert len(bounds), 'Failed to load bounds' rows_old = len(Ads) Ads, b = filter_bounds(Ads, b, bounds, corner) - print('Filter bounds: %s => %s + %s rows' % (rows_old, len(Ads), len(Ads2))) + print( + 'Filter bounds: %s => %s + %s rows' % + (rows_old, len(Ads), len(Ads2))) Ads = Ads + Ads2 b = b + b2 assert len(Ads) or allow_zero_eqns() @@ -145,7 +163,6 @@ def run(fns_in, corner, run_corner, sub_json=None, sub_csv=None, dedup=True, mas #print #col_dist(A_ubd, 'final', names) print('b10', b[0:100]) - ''' Given: a >= 10 @@ -169,4 +186,11 @@ def run(fns_in, corner, run_corner, sub_json=None, sub_csv=None, dedup=True, mas print('Converting to numpy...') names, Anp = A_ds2np(Ads) - run_corner(Anp, np.asarray(b), names, corner, outfn=outfn, verbose=verbose, **kwargs) + run_corner( + Anp, + np.asarray(b), + names, + corner, + outfn=outfn, + verbose=verbose, + **kwargs) diff --git a/fuzzers/007-timing/timgrid/tile_txt2json.py b/fuzzers/007-timing/timgrid/tile_txt2json.py index b6e410ff..4342805d 100644 --- a/fuzzers/007-timing/timgrid/tile_txt2json.py +++ b/fuzzers/007-timing/timgrid/tile_txt2json.py @@ -6,6 +6,8 @@ import time import json SI_NONE = 0xFFFF + + def load_speed_json(f): j = json.load(f) # Index speed indexes to names @@ -16,6 +18,7 @@ def load_speed_json(f): speed_i2s[i] = k return j, speed_i2s + def gen_tiles(fnin, speed_i2s): for l in open(fnin): # lappend items pip $name $speed_index @@ -28,7 +31,7 @@ def gen_tiles(fnin, speed_i2s): pips = {} wires = {} for i in range(0, len(tuples), 3): - ttype, name, speed_index = tuples[i:i+3] + ttype, name, speed_index = tuples[i:i + 3] name_local = name.split('/')[1] { 'pip': pips, @@ -36,6 +39,7 @@ def gen_tiles(fnin, speed_i2s): }[ttype][name_local] = speed_i2s[int(speed_index)] yield (tile_type, tile_name, grid_x, grid_y, pips, wires) + def run(fnin, fnout, speed_json_fn, verbose=False): speedj, speed_i2s = load_speed_json(open(speed_json_fn, 'r')) @@ -46,23 +50,24 @@ def run(fnin, fnout, speed_json_fn, verbose=False): if tile_type not in tiles: tiles[tile_type] = this_dat else: - if tiles[tile_type] != this_dat: - print(tile_name, tile_type) - print(this_dat) - print(tiles[tile_type]) - assert 0 - + if tiles[tile_type] != this_dat: + print(tile_name, tile_type) + print(this_dat) + print(tiles[tile_type]) + assert 0 + j = {'tiles': tiles} - json.dump(j, open(fnout, 'w'), sort_keys=True, indent=4, separators=(',', ': ')) + json.dump( + j, open(fnout, 'w'), sort_keys=True, indent=4, separators=(',', ': ')) + def main(): import argparse - parser = argparse.ArgumentParser( - description= - 'Solve timing solution' - ) - parser.add_argument('--speed-json', default='../../speed/build/speed.json', + parser = argparse.ArgumentParser(description='Solve timing solution') + parser.add_argument( + '--speed-json', + default='../../speed/build/speed.json', help='Provides speed index to name translation') parser.add_argument('fnin', default=None, help='input tcl output .txt') parser.add_argument('fnout', default=None, help='output .json') @@ -70,5 +75,6 @@ def main(): run(args.fnin, args.fnout, speed_json_fn=args.speed_json, verbose=False) + if __name__ == '__main__': main() diff --git a/fuzzers/007-timing/timing_txt2csv.py b/fuzzers/007-timing/timing_txt2csv.py index 51f04f42..1a4891eb 100644 --- a/fuzzers/007-timing/timing_txt2csv.py +++ 
b/fuzzers/007-timing/timing_txt2csv.py @@ -14,9 +14,11 @@ SI_NONE = 0xFFFF PREFIX_W = 'WIRE_' PREFIX_P = 'PIP_' + #PREFIX_W = '' #PREFIX_P = '' + def parse_pip(s): # Entries like # CLK_BUFG_REBUF_X60Y117/CLK_BUFG_REBUF.CLK_BUFG_REBUF_R_CK_GCLK0_BOT<<->>CLK_BUFG_REBUF_R_CK_GCLK0_TOP @@ -28,22 +30,26 @@ def parse_pip(s): #return (site, type, pip_junction, pip) return site, instance, int(speed_index) + def parse_node(s): node, nwires = s.split(':') return node, int(nwires) + def parse_wire(s): # CLBLM_R_X3Y80/CLBLM_M_D6:952 wirestr, speed_index = s.split(':') site, instance = wirestr.split('/') return site, instance, int(speed_index) + # FIXME: these actually have a delay element # Probably need to put these back in def remove_virtual_pips(pips): return pips return filter(lambda pip: not re.match(r'CLBL[LM]_[LR]_', pip[0]), pips) + def load_timing3(f, name='file'): # src_bel dst_bel ico fast_max fast_min slow_max slow_min pips f.readline() @@ -66,25 +72,27 @@ def load_timing3(f, name='file'): pips = pips.split('|') nodes = nodes.split('|') wires = wires.split('|') - ret.append({ - 'net': net, - 'src_bel': src_bel, - 'dst_bel': dst_bel, - 'ico': int(ico), - # ps - 'fast_max': int(fast_max), - 'fast_min': int(fast_min), - 'slow_max': int(slow_max), - 'slow_min': int(slow_min), - 'pips': remove_virtual_pips([parse_pip(pip) for pip in pips]), - 'nodes': [parse_node(node) for node in nodes], - 'wires': [parse_wire(wire) for wire in wires], - 'line': l, + ret.append( + { + 'net': net, + 'src_bel': src_bel, + 'dst_bel': dst_bel, + 'ico': int(ico), + # ps + 'fast_max': int(fast_max), + 'fast_min': int(fast_min), + 'slow_max': int(slow_max), + 'slow_min': int(slow_min), + 'pips': remove_virtual_pips([parse_pip(pip) for pip in pips]), + 'nodes': [parse_node(node) for node in nodes], + 'wires': [parse_wire(wire) for wire in wires], + 'line': l, }) print(' load %s: %d bad, %d good' % (name, bads, len(ret))) #assert 0 return ret + def load_speed_json(f): j = json.load(f) # Index speed indexes to names @@ -95,6 +103,7 @@ def load_speed_json(f): speed_i2s[i] = k return j, speed_i2s + # Verify the nodes and wires really do line up def vals2Adi_check(vals, names): print('Checking') @@ -106,12 +115,12 @@ def vals2Adi_check(vals, names): print('Done') assert 0 -def vals2Adi(vals, speed_i2s, - name_tr={}, name_drop=[], - verbose=False): + +def vals2Adi(vals, speed_i2s, name_tr={}, name_drop=[], verbose=False): def pip2speed(pip): - _site, _name, speed_index = pip + _site, _name, speed_index = pip return PREFIX_P + speed_i2s[speed_index] + def wire2speed(wire): _site, _name, speed_index = wire return PREFIX_W + speed_i2s[speed_index] @@ -119,7 +128,8 @@ def vals2Adi(vals, speed_i2s, # Want this ordered names = OrderedDict() - print('Creating matrix w/ tr: %d, drop: %d' % (len(name_tr), len(name_drop))) + print( + 'Creating matrix w/ tr: %d, drop: %d' % (len(name_tr), len(name_drop))) # Take sites out entirely using handy "interconnect only" option #vals = filter(lambda x: str(x).find('SLICE') >= 0, vals) @@ -171,6 +181,7 @@ def vals2Adi(vals, speed_i2s, print('Creating delay element matrix w/ %d names' % len(names)) Adi = [None for _i in range(len(vals))] for vali, val in enumerate(vals): + def add_name(name): if name in name_drop: return @@ -192,12 +203,14 @@ def vals2Adi(vals, speed_i2s, return Adi, names + # TODO: load directly as Ads # remove names_tr, names_drop def vals2Ads(vals, speed_i2s, verbose=False): Adi, names = vals2Adi(vals, speed_i2s, verbose=False) return A_di2ds(Adi, names) + def 
load_Ads(speed_json_f, f_ins): print('Loading data') @@ -211,12 +224,15 @@ def load_Ads(speed_json_f, f_ins): Ads = vals2Ads(vals, speed_i2s) def mkb(val): - return (val['fast_max'], val['fast_min'], val['slow_max'], val['slow_min']) + return ( + val['fast_max'], val['fast_min'], val['slow_max'], val['slow_min']) + b = [mkb(val) for val in vals] ico = [val['ico'] for val in vals] return Ads, b, ico + def run(speed_json_f, fout, f_ins, verbose=0, corner=None): Ads, bs, ico = load_Ads(speed_json_f, f_ins) @@ -229,6 +245,7 @@ def run(speed_json_f, fout, f_ins, verbose=0, corner=None): items.append('%u %s' % (v, k)) fout.write(','.join(items) + '\n') + def main(): import argparse @@ -238,14 +255,14 @@ def main(): ) parser.add_argument('--verbose', type=int, help='') - parser.add_argument('--auto-name', action='store_true', help='timing3.txt => timing3.csv') - parser.add_argument('--speed-json', default='build_speed/speed.json', + parser.add_argument( + '--auto-name', action='store_true', help='timing3.txt => timing3.csv') + parser.add_argument( + '--speed-json', + default='build_speed/speed.json', help='Provides speed index to name translation') parser.add_argument('--out', default=None, help='Output csv') - parser.add_argument( - 'fns_in', - nargs='*', - help='timing3.txt input files') + parser.add_argument('fns_in', nargs='*', help='timing3.txt input files') args = parser.parse_args() bench = Benchmark() @@ -265,8 +282,12 @@ def main(): if not fns_in: fns_in = glob.glob('specimen_*/timing3.txt') - run(speed_json_f=open(args.speed_json, 'r'), fout=fout, - f_ins=[(open(fn_in, 'r'), fn_in) for fn_in in fns_in], verbose=args.verbose) + run( + speed_json_f=open(args.speed_json, 'r'), + fout=fout, + f_ins=[(open(fn_in, 'r'), fn_in) for fn_in in fns_in], + verbose=args.verbose) + if __name__ == '__main__': main()
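As a worked example of the parsers above, using the sample string from the comment in parse_wire:

# parse_wire('CLBLM_R_X3Y80/CLBLM_M_D6:952') splits on ':' then '/':
# -> ('CLBLM_R_X3Y80', 'CLBLM_M_D6', 952)
# i.e. (tile, wire name within the tile, speed index); speed_i2s then maps
# 952 back to a speed model name, and PREFIX_W marks it as a wire delay
# so wire and pip variables cannot collide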
diff --git a/fuzzers/007-timing/wire_unique.py b/fuzzers/007-timing/wire_unique.py index 391c2e0c..efae6e26 100644 --- a/fuzzers/007-timing/wire_unique.py +++ b/fuzzers/007-timing/wire_unique.py @@ -4,6 +4,7 @@ Verifies that node timing info is unique import re + def gen_wires(fin): for l in fin: lj = {} @@ -12,7 +13,8 @@ def gen_wires(fin): name, value = kvs.split(':') lj[name] = value - tile_type, xy, wname = re.match(r'(.*)_(X[0-9]*Y[0-9]*)/(.*)', lj['NAME']).groups() + tile_type, xy, wname = re.match( + r'(.*)_(X[0-9]*Y[0-9]*)/(.*)', lj['NAME']).groups() lj['tile_type'] = tile_type lj['xy'] = xy lj['wname'] = wname @@ -21,10 +23,12 @@ def gen_wires(fin): yield lj + def run(node_fin, verbose=0): refnodes = {} nodei = 0 for nodei, anode in enumerate(gen_wires(node_fin)): + def getk(anode): return anode['wname'] #return (anode['tile_type'], anode['wname']) @@ -39,32 +43,34 @@ def run(node_fin, verbose=0): refnodes[getk(anode)] = anode continue k_invariant = ( - 'COST_CODE', - 'IS_INPUT_PIN', - 'IS_OUTPUT_PIN', - 'IS_PART_OF_BUS', - 'NUM_INTERSECTS', - 'NUM_TILE_PORTS', - 'SPEED_INDEX', - 'TILE_PATTERN_OFFSET', - ) + 'COST_CODE', + 'IS_INPUT_PIN', + 'IS_OUTPUT_PIN', + 'IS_PART_OF_BUS', + 'NUM_INTERSECTS', + 'NUM_TILE_PORTS', + 'SPEED_INDEX', + 'TILE_PATTERN_OFFSET', + ) k_varies = ( - 'ID_IN_TILE_TYPE', - 'IS_CONNECTED', - 'NUM_DOWNHILL_PIPS', - 'NUM_PIPS', - 'NUM_UPHILL_PIPS', - 'TILE_NAME', - ) + 'ID_IN_TILE_TYPE', + 'IS_CONNECTED', + 'NUM_DOWNHILL_PIPS', + 'NUM_PIPS', + 'NUM_UPHILL_PIPS', + 'TILE_NAME', + ) # Verify equivalence for k in k_invariant: if k in refnode and k in anode: + def fail(): print('Mismatch on %s' % k) print(refnode[k], anode[k]) print(refnode['l']) print(anode['l'])
#assert 0 + if refnode[k] != anode[k]: fail() @@ -74,19 +80,14 @@ def run(node_fin, verbose=0): elif k not in k_varies: assert 0 + if __name__ == '__main__': import argparse - parser = argparse.ArgumentParser( - description= - 'Timing fuzzer' - ) + parser = argparse.ArgumentParser(description='Timing fuzzer') parser.add_argument('--verbose', type=int, help='') parser.add_argument( - 'node_fn_in', - default='/dev/stdin', - nargs='?', - help='Input file') + 'node_fn_in', default='/dev/stdin', nargs='?', help='Input file') args = parser.parse_args() run(open(args.node_fn_in, 'r'), verbose=args.verbose) From 3b686de46fd3936b956c91355374795ab4f6abf9 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Mon, 17 Sep 2018 11:28:03 -0700 Subject: [PATCH 49/55] timfuz: move non-fuzzer experiments to experiments dir Signed-off-by: John McMaster --- {fuzzers/007-timing => experiments/timfuz}/node_unique.py | 8 +++----- {fuzzers/007-timing => experiments/timfuz}/pip_unique.py | 8 +++----- {fuzzers/007-timing => experiments/timfuz}/wire_unique.py | 8 +++----- 3 files changed, 9 insertions(+), 15 deletions(-) rename {fuzzers/007-timing => experiments/timfuz}/node_unique.py (95%) rename {fuzzers/007-timing => experiments/timfuz}/pip_unique.py (94%) rename {fuzzers/007-timing => experiments/timfuz}/wire_unique.py (94%) diff --git a/fuzzers/007-timing/node_unique.py b/experiments/timfuz/node_unique.py similarity index 95% rename from fuzzers/007-timing/node_unique.py rename to experiments/timfuz/node_unique.py index 83b054b9..4a0630e7 100644 --- a/fuzzers/007-timing/node_unique.py +++ b/experiments/timfuz/node_unique.py @@ -1,7 +1,3 @@ -''' -Verifies that node timing info is unique -''' - import re @@ -95,7 +91,9 @@ def run(node_fin, verbose=0): if __name__ == '__main__': import argparse - parser = argparse.ArgumentParser(description='Timing fuzzer') + parser = argparse.ArgumentParser( + description= + 'Determines which info is consistent across nodes with the same name') parser.add_argument('--verbose', type=int, help='') parser.add_argument( diff --git a/fuzzers/007-timing/pip_unique.py b/experiments/timfuz/pip_unique.py similarity index 94% rename from fuzzers/007-timing/pip_unique.py rename to experiments/timfuz/pip_unique.py index b38c9f4e..f49cb1ca 100644 --- a/fuzzers/007-timing/pip_unique.py +++ b/experiments/timfuz/pip_unique.py @@ -1,7 +1,3 @@ -''' -Verifies that node timing info is unique -''' - import re @@ -79,7 +75,9 @@ def run(node_fin, verbose=0): if __name__ == '__main__': import argparse - parser = argparse.ArgumentParser(description='Timing fuzzer') + parser = argparse.ArgumentParser( + description= + 'Determines which info is consistent across PIPs with the same name') parser.add_argument('--verbose', type=int, help='') parser.add_argument( diff --git a/fuzzers/007-timing/wire_unique.py b/experiments/timfuz/wire_unique.py similarity index 94% rename from fuzzers/007-timing/wire_unique.py rename to experiments/timfuz/wire_unique.py index efae6e26..c7b57272 100644 --- a/fuzzers/007-timing/wire_unique.py +++ b/experiments/timfuz/wire_unique.py @@ -1,7 +1,3 @@ -''' -Verifies that node timing info is unique -''' - import re @@ -84,7 +80,9 @@ def run(node_fin, verbose=0): if __name__ == '__main__': import argparse - parser = argparse.ArgumentParser(description='Timing fuzzer') + parser = argparse.ArgumentParser( + description= + 'Determines which info is consistent across wires with the same name') parser.add_argument('--verbose', type=int, help='') parser.add_argument( From
bf5b435a69852af725e7a9cdbd2ad8a42296d18b Mon Sep 17 00:00:00 2001 From: John McMaster Date: Mon, 17 Sep 2018 14:23:00 -0700 Subject: [PATCH 50/55] timfuz: cleanup help Signed-off-by: John McMaster --- .../timfuz}/perf_test.py | 2 +- fuzzers/007-timing/checksub.py | 4 +-- fuzzers/007-timing/corner_csv.py | 2 +- fuzzers/007-timing/csv_flat2group.py | 5 +-- fuzzers/007-timing/csv_group2flat.py | 35 +++++++++++-------- fuzzers/007-timing/projects/corner.mk | 2 +- fuzzers/007-timing/rref.py | 30 ++++------------ fuzzers/007-timing/solve_leastsq.py | 9 +++-- fuzzers/007-timing/solve_linprog.py | 6 ++-- fuzzers/007-timing/sub2csv.py | 2 +- fuzzers/007-timing/tile_annotate.py | 13 +++---- fuzzers/007-timing/timing_txt2csv.py | 7 ++-- 12 files changed, 55 insertions(+), 62 deletions(-) rename {fuzzers/007-timing => experiments/timfuz}/perf_test.py (97%) diff --git a/fuzzers/007-timing/perf_test.py b/experiments/timfuz/perf_test.py similarity index 97% rename from fuzzers/007-timing/perf_test.py rename to experiments/timfuz/perf_test.py index cb400809..77d0aefe 100644 --- a/fuzzers/007-timing/perf_test.py +++ b/experiments/timfuz/perf_test.py @@ -119,7 +119,7 @@ def run( def main(): import argparse - parser = argparse.ArgumentParser(description='Timing fuzzer') + parser = argparse.ArgumentParser(description='Matrix solving performance tests') parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--sparse', action='store_true', help='') diff --git a/fuzzers/007-timing/checksub.py b/fuzzers/007-timing/checksub.py index 7a307e14..977d5b6f 100644 --- a/fuzzers/007-timing/checksub.py +++ b/fuzzers/007-timing/checksub.py @@ -108,11 +108,11 @@ def main(): import argparse parser = argparse.ArgumentParser( - description='Check sub.json solution feasibility') + description='Check if sub.json would make a linear equation solvable') parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--sub-json', help='') - parser.add_argument('fns_in', nargs='*', help='timing3.csv input files') + parser.add_argument('fns_in', nargs='+', help='timing3.csv input files') args = parser.parse_args() # Store options in dict to ease passing through functions bench = Benchmark() diff --git a/fuzzers/007-timing/corner_csv.py b/fuzzers/007-timing/corner_csv.py index 429e1e55..a4ccbf84 100644 --- a/fuzzers/007-timing/corner_csv.py +++ b/fuzzers/007-timing/corner_csv.py @@ -31,7 +31,7 @@ def main(): '--auto-name', action='store_true', help='timing3.csv => timing3c.csv') parser.add_argument('--out', default=None, help='Output csv') parser.add_argument('--corner', help='Output csv') - parser.add_argument('fns_in', nargs='*', help='timing3.csv input files') + parser.add_argument('fns_in', nargs='+', help='timing3.csv input files') args = parser.parse_args() bench = Benchmark() diff --git a/fuzzers/007-timing/csv_flat2group.py b/fuzzers/007-timing/csv_flat2group.py index 4cde0e61..4cdc04fd 100644 --- a/fuzzers/007-timing/csv_flat2group.py +++ b/fuzzers/007-timing/csv_flat2group.py @@ -34,7 +34,8 @@ def run(fns_in, fnout, sub_json, strict=False, verbose=False): def main(): import argparse - parser = argparse.ArgumentParser(description='Solve timing solution') + parser = argparse.ArgumentParser( + description='Substitute .csv to group correlated symbols') parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--strict', action='store_true', help='') @@ -44,7 +45,7 @@ def main(): required=True, help='Group substitutions to make fully ranked') 
parser.add_argument('--out', help='Output sub.json substitution result') - parser.add_argument('fns_in', nargs='*', help='timing3.txt input files') + parser.add_argument('fns_in', nargs='+', help='timing3.csv input files') args = parser.parse_args() # Store options in dict to ease passing through functions bench = Benchmark() diff --git a/fuzzers/007-timing/csv_group2flat.py b/fuzzers/007-timing/csv_group2flat.py index 438be40e..45aacdb1 100644 --- a/fuzzers/007-timing/csv_group2flat.py +++ b/fuzzers/007-timing/csv_group2flat.py @@ -52,37 +52,44 @@ def gen_flat(fnin, sub_json, corner=None): yield zero, zero_row -def run(fnin, fnout, sub_json, corner=None, sort=False, verbose=False): +def run(fns_in, fnout, sub_json, corner=None, sort=False, verbose=False): + ''' if sort: sortf = sorted else: sortf = lambda x: x + ''' with open(fnout, 'w') as fout: fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n') - #for name, corners in sortf(gen_flat(fnin, sub_json)): - for name, corners in gen_flat(fnin, sub_json, corner=corner): - row_ico = 1 - items = [str(row_ico), corners2csv(corners)] - items.append('%u %s' % (1, name)) - fout.write(','.join(items) + '\n') + for fnin in fns_in: + #for name, corners in sortf(gen_flat(fnin, sub_json)): + for name, corners in gen_flat(fnin, sub_json, corner=corner): + row_ico = 1 + items = [str(row_ico), corners2csv(corners)] + items.append('%u %s' % (1, name)) + fout.write(','.join(items) + '\n') def main(): import argparse - parser = argparse.ArgumentParser(description='Solve timing solution') + parser = argparse.ArgumentParser( + description='Substitute .csv to ungroup correlated symbols') parser.add_argument('--verbose', action='store_true', help='') - parser.add_argument('--sort', action='store_true', help='') + #parser.add_argument('--sort', action='store_true', help='') parser.add_argument('--sub-csv', help='') parser.add_argument( '--sub-json', required=True, help='Group substitutions to make fully ranked') parser.add_argument('--corner', default=None, help='') - parser.add_argument('fnin', default=None, help='input timing delay .csv') - parser.add_argument('fnout', default=None, help='output timing delay .csv') + parser.add_argument('--out', default=None, help='output timing delay .csv') + parser.add_argument( + 'fns_in', + nargs='+', + default=None, + help='input timing delay .csv (NOTE: must be single column)') args = parser.parse_args() # Store options in dict to ease passing through functions bench = Benchmark() @@ -91,10 +98,10 @@ def main(): try: run( - args.fnin, - args.fnout, + args.fns_in, + args.out, sub_json=sub_json, - sort=args.sort, + #sort=args.sort, verbose=args.verbose, corner=args.corner) finally: diff --git a/fuzzers/007-timing/projects/corner.mk b/fuzzers/007-timing/projects/corner.mk index aaa3cbf2..3ed37050 100644 --- a/fuzzers/007-timing/projects/corner.mk +++ b/fuzzers/007-timing/projects/corner.mk @@ -37,7 +37,7 @@ build/$(CORNER)/linprog.csv: build/$(CORNER)/leastsq.csv build/grouped.csv build/$(CORNER)/flat.csv: build/$(CORNER)/linprog.csv # Take separated variables and back-annotate them to the original timing variables - python3 $(TIMFUZ_DIR)/csv_group2flat.py --sub-json build/sub.json --corner $(CORNER) --sort build/$(CORNER)/linprog.csv build/$(CORNER)/flat.csv.tmp + python3 $(TIMFUZ_DIR)/csv_group2flat.py --sub-json build/sub.json --corner $(CORNER) --out build/$(CORNER)/flat.csv.tmp build/$(CORNER)/linprog.csv mv build/$(CORNER)/flat.csv.tmp build/$(CORNER)/flat.csv build/$(CORNER)/tilea.json: build/$(CORNER)/flat.csv
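For reference, the flat.csv produced by this rule uses the four-corner csv layout from timfuz.py, with unsolved corners left as None; a minimal sketch (the delay value and variable name are invented):

# acorner2csv(123, corner_s2i['slow_max']) -> 'None None 123 None'
# so a flattened slow_max-only row in flat.csv looks like:
# 1,None None 123 None,1 WIRE_SOME_MODEL
# (ico flag, the four corner delays in ps, then one variable with coefficient 1)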
diff --git a/fuzzers/007-timing/rref.py b/fuzzers/007-timing/rref.py index 97b4efa0..6db813b4 100644 --- a/fuzzers/007-timing/rref.py +++ b/fuzzers/007-timing/rref.py @@ -14,28 +14,12 @@ from collections import OrderedDict from fractions import Fraction -def fracr(r): - DELTA = 0.0001 - - for i, x in enumerate(r): - if type(x) is float: - xi = int(x) - assert abs(xi - x) < DELTA - r[i] = xi - return [Fraction(x) for x in r] - - -def fracm(m): - return [fracr(r) for r in m] - - def fracr_quick(r): return [Fraction(numerator=int(x), denominator=1) for x in r] -# the way I'm doing thing they should all be even integers -# hmm this was only slightly faster def fracm_quick(m): + '''Convert integer matrix to Fraction matrix''' t = type(m[0][0]) print('fracm_quick type: %s' % t) return [fracr_quick(r) for r in m] @@ -149,7 +133,6 @@ def state_rref(state, verbose=False): #msym = sympy.MutableSparseMatrix(mfrac) msym = sympy.Matrix(mfrac) # internal encoding has significnat performance implications - #print(type(msym[3])) #assert type(msym[0]) is sympy.Integer if verbose: @@ -221,7 +204,10 @@ def run(fnout, fn_ins, simplify=False, corner=None, verbose=0): def main(): import argparse - parser = argparse.ArgumentParser(description='Timing fuzzer') + parser = argparse.ArgumentParser( + description= + 'Compute reduced row echelon (RREF) to form sub.json (variable groups)' + ) parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--simplify', action='store_true', help='') @@ -231,14 +217,10 @@ def main(): default='build_speed/speed.json', help='Provides speed index to name translation') parser.add_argument('--out', help='Output sub.json substitution result') - parser.add_argument('fns_in', nargs='+', help='timing3.txt input files') + parser.add_argument('fns_in', nargs='+', help='timing3.csv input files') args = parser.parse_args() bench = Benchmark() - fns_in = args.fns_in - if not fns_in: - fns_in = glob.glob('specimen_*/timing3.csv') - try: run( fnout=args.out, diff --git a/fuzzers/007-timing/solve_leastsq.py b/fuzzers/007-timing/solve_leastsq.py index 1a1b55e6..5bd1f7b0 100644 --- a/fuzzers/007-timing/solve_leastsq.py +++ b/fuzzers/007-timing/solve_leastsq.py @@ -156,13 +156,16 @@ def main(): 'Solve timing solution using least squares objective function') parser.add_argument('--verbose', action='store_true', help='') - parser.add_argument('--massage', action='store_true', help='') + parser.add_argument( + '--massage', + action='store_true', + help='Derive additional constraints to improve solution') parser.add_argument( '--sub-json', help='Group substitutions to make fully ranked') - parser.add_argument('--corner', default="slow_max", help='') + parser.add_argument('--corner', required=True, default="slow_max", help='') parser.add_argument( '--out', default=None, help='output timing delay .json') - parser.add_argument('fns_in', nargs='+', help='timing3.csv input files') + parser.add_argument('fns_in', nargs='+', 'timing3.csv input files') args = parser.parse_args() # Store options in dict to ease passing through functions bench = Benchmark() diff --git a/fuzzers/007-timing/solve_linprog.py b/fuzzers/007-timing/solve_linprog.py index 29e4d826..28f181a6 100644 --- a/fuzzers/007-timing/solve_linprog.py +++ b/fuzzers/007-timing/solve_linprog.py @@ -195,10 +195,10 @@ def main(): parser.add_argument('--sub-csv', help='') parser.add_argument( '--sub-json', help='Group substitutions to make fully ranked') - parser.add_argument('--corner', default=None, required=True, help='') + 
parser.add_argument('--corner', required=True, default="slow_max", help='') parser.add_argument( '--out', default=None, help='output timing delay .json') - parser.add_argument('fns_in', nargs='*', help='timing3.csv input files') + parser.add_argument('fns_in', nargs='+', help='timing3.csv input files') args = parser.parse_args() # Store options in dict to ease passing through functions bench = Benchmark() @@ -216,7 +216,7 @@ def main(): run_corner=run_corner, sub_json=sub_json, sub_csv=args.sub_csv, - fns_in=fns_in, + fn_in=fn_in, corner=args.corner, massage=args.massage, outfn=args.out, diff --git a/fuzzers/007-timing/sub2csv.py b/fuzzers/007-timing/sub2csv.py index 8567d5e3..dfb65227 100644 --- a/fuzzers/007-timing/sub2csv.py +++ b/fuzzers/007-timing/sub2csv.py @@ -91,7 +91,7 @@ def main(): parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--out', help='Output csv') - parser.add_argument('fns_in', nargs='*', help='sub.json input files') + parser.add_argument('fns_in', nargs='+', help='sub.json input files') args = parser.parse_args() bench = Benchmark() diff --git a/fuzzers/007-timing/tile_annotate.py b/fuzzers/007-timing/tile_annotate.py index 58b89235..7e87f2fa 100644 --- a/fuzzers/007-timing/tile_annotate.py +++ b/fuzzers/007-timing/tile_annotate.py @@ -9,16 +9,10 @@ import time import json -# corner wokraround -def quad(x): - return [x for _ in range(4)] - - def run(fnin, fnout, tile_json_fn, verbose=False): # modified in place tilej = json.load(open(tile_json_fn, 'r')) - # FIXME: all corners Ads, bs = loadc_Ads_bs([fnin], ico=True) bounds = Ads2bounds(Ads, bs) @@ -71,9 +65,12 @@ def run(fnin, fnout, tile_json_fn, verbose=False): def main(): import argparse - parser = argparse.ArgumentParser(description='') + parser = argparse.ArgumentParser( + description= + 'Substitute timgrid timing model names for real timing values') parser.add_argument('--tile-json', default='tiles.json', help='') - parser.add_argument('fnin', default=None, help='Flattened timing csv') + parser.add_argument( + 'fnin', default=None, help='Input flattened timing csv (flat.json)') parser.add_argument('fnout', default=None, help='output tile .json') args = parser.parse_args() diff --git a/fuzzers/007-timing/timing_txt2csv.py b/fuzzers/007-timing/timing_txt2csv.py index 1a4891eb..ebdda26d 100644 --- a/fuzzers/007-timing/timing_txt2csv.py +++ b/fuzzers/007-timing/timing_txt2csv.py @@ -255,14 +255,15 @@ def main(): ) parser.add_argument('--verbose', type=int, help='') + # made a bulk conversion easier...keep? 
parser.add_argument( '--auto-name', action='store_true', help='timing3.txt => timing3.csv') parser.add_argument( '--speed-json', default='build_speed/speed.json', help='Provides speed index to name translation') - parser.add_argument('--out', default=None, help='Output csv') - parser.add_argument('fns_in', nargs='*', help='timing3.txt input files') + parser.add_argument('--out', default=None, help='Output timing3.csv file') + parser.add_argument('fns_in', nargs='+', help='Input timing3.txt files') args = parser.parse_args() bench = Benchmark() @@ -274,6 +275,8 @@ def main(): fnout = fnin.replace('.txt', '.csv') assert fnout != fnin, 'Expect .txt in' else: + # practically there are too many stray prints to make this work as expected + assert 0, 'File name required' fnout = '/dev/stdout' print("Writing to %s" % fnout) fout = open(fnout, 'w') From 43ccabe8152d3bbac1db5c83c69cadbf01edc44e Mon Sep 17 00:00:00 2001 From: John McMaster Date: Mon, 17 Sep 2018 14:26:03 -0700 Subject: [PATCH 51/55] timfuz: massage cleanup Signed-off-by: John McMaster --- fuzzers/007-timing/timfuz_massage.py | 149 +-------------------------- 1 file changed, 5 insertions(+), 144 deletions(-) diff --git a/fuzzers/007-timing/timfuz_massage.py b/fuzzers/007-timing/timfuz_massage.py index 4be04737..4871e0f4 100644 --- a/fuzzers/007-timing/timfuz_massage.py +++ b/fuzzers/007-timing/timfuz_massage.py @@ -333,83 +333,12 @@ def derive_eq_by_col(Ads, b_ub, verbose=0): return Ads_ret, b_ret -# keep derriving until solution is (probably) stable -def massage_equations_old(Ads, b, verbose=False, derive_lim=3, corner=None): - ''' - Equation pipeline - Some operations may generate new equations - Simplify after these to avoid unnecessary overhead on redundant constraints - Similarly some operations may eliminate equations, potentially eliminating a column (ie variable) - Remove these columns as necessary to speed up solving - ''' - - def debug(what): - if verbose: - print('') - print_eqns(Ads, b, verbose=verbose, label=what, lim=20) - col_dist(Ads, what) - check_feasible_d(Ads, b) - - # Try to (intelligently) subtract equations to generate additional constraints - # This helps avoid putting all delay in a single shared variable - dstart = len(b) - - # Original simple - for di in range(derive_lim): - print - assert len(Ads) == len(b) - n_orig = len(b) - - # Meat of the operation - # Focus on easy equations for first pass to get a lot of easy derrivations - col_lim = 12 if di == 0 else None - #col_lim = None - Ads, b = derive_eq_by_row(Ads, b, col_lim=col_lim) - debug("der_rows") - # Run another simplify pass since new equations may have overlap with original - Ads, b = simplify_rows(Ads, b, corner=corner) - print( - 'Derive row %d / %d: %d => %d equations' % - (di + 1, derive_lim, n_orig, len(b))) - debug("der_rows simp") - - n_orig2 = len(b) - # Meat of the operation - Ads, b = derive_eq_by_col(Ads, b) - debug("der_cols") - # Run another simplify pass since new equations may have overlap with original - Ads, b = simplify_rows(Ads, b, corner=corner) - print( - 'Derive col %d / %d: %d => %d equations' % - (di + 1, derive_lim, n_orig2, len(b))) - debug("der_cols simp") - - if n_orig == len(b): - break - - dend = len(b) - print('') - print('Derive net: %d => %d' % (dstart, dend)) - print('') - # Was experimentting to see how much the higher order columns really help - ''' - cols_min_post = opts.get('cols_min_post', None) - cols_max_post = opts.get('cols_max_post', None) - # Filter input based on number of columns - if cols_min_post or 
cols_max_post: - Ads, b = filter_ncols(Ads=Ads, b=b, cols_min=cols_min_post, cols_max=cols_max_post) - debug("filter_ncals final") - ''' - - # Helps debug readability - Ads, b = sort_equations(Ads, b) - debug("final (sorted)") - return Ads, b - - # iteratively increasing column limit until all columns are added -def massage_equations_inc_col_lim(Ads, b, verbose=False, corner=None): +def massage_equations(Ads, b, verbose=False, corner=None): ''' + Subtract equations from each other to generate additional constraints + Helps provide additional guidance to solver for realistic delays + Equation pipeline Some operations may generate new equations Simplify after these to avoid unnecessary overhead on redundant constraints @@ -463,6 +392,7 @@ def massage_equations_inc_col_lim(Ads, b, verbose=False, corner=None): col_dist(Ads, 'derive done iter %d, lim %d' % (di, col_lim), lim=12) rows = len(Ads) + # possible that a new equation was generated and taken away, but close enough if n_orig == len(b) and col_lim >= cols: break col_lim += col_lim / 5 @@ -480,72 +410,3 @@ def massage_equations_inc_col_lim(Ads, b, verbose=False, corner=None): print('') print('Massage final: %d => %d rows' % (dstart, dend)) return Ads, b - - -# only derive based on nearby equations -# theory is they will be the best to diff -def massage_equations_near(Ads, b, verbose=False, corner=None): - ''' - Equation pipeline - Some operations may generate new equations - Simplify after these to avoid unnecessary overhead on redundant constraints - Similarly some operations may eliminate equations, potentially eliminating a column (ie variable) - Remove these columns as necessary to speed up solving - ''' - - def debug(what): - if verbose: - print('') - print_eqns(Ads, b, verbose=verbose, label=what, lim=20) - col_dist(Ads, what) - check_feasible_d(Ads, b) - - # Try to (intelligently) subtract equations to generate additional constraints - # This helps avoid putting all delay in a single shared variable - dstart = len(b) - cols = len(index_names(Ads)) - - # Each iteration one more column is allowed until all columns are included - # (and the system is stable) - print - n_orig = len(b) - - # Meat of the operation - Ads, b = derive_eq_by_near_row(Ads, b, tweak=True) - debug("der_rows") - # Run another simplify pass since new equations may have overlap with original - Ads, b = simplify_rows(Ads, b, corner=corner) - print('Derive row: %d => %d equations' % (n_orig, len(b))) - debug("der_rows simp") - - n_orig2 = len(b) - # Meat of the operation - Ads, b = derive_eq_by_col(Ads, b) - debug("der_cols") - # Run another simplify pass since new equations may have overlap with original - Ads, b = simplify_rows(Ads, b, corner=corner) - print('Derive col: %d => %d equations' % (n_orig2, len(b))) - debug("der_cols simp") - - # Doesn't help computation, but helps debugging - Ads, b = sort_equations(Ads, b) - debug("loop done") - col_dist(Ads, 'derive done', lim=12) - - rows = len(Ads) - - dend = len(b) - print('') - print('Derive net: %d => %d' % (dstart, dend)) - print('') - # Was experimentting to see how much the higher order columns really help - - # Helps debug readability - Ads, b = sort_equations(Ads, b) - debug("final (sorted)") - print('') - print('Massage final: %d => %d rows' % (dstart, dend)) - return Ads, b - - -massage_equations = massage_equations_inc_col_lim From d5c9f1d8578cc09b1c64ccc248f20e4df8086966 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Mon, 17 Sep 2018 14:39:58 -0700 Subject: [PATCH 52/55] timfuz: misc cleanup 
Signed-off-by: John McMaster --- fuzzers/007-timing/checksub.py | 9 ++++----- fuzzers/007-timing/csv_flat2group.py | 6 +++++- fuzzers/007-timing/csv_group2flat.py | 13 ------------- fuzzers/007-timing/rref.py | 13 +++++++------ fuzzers/007-timing/solve_leastsq.py | 7 +------ fuzzers/007-timing/solve_linprog.py | 6 +++--- fuzzers/007-timing/sub2csv.py | 20 +------------------- fuzzers/007-timing/timfuz_massage.py | 10 ++++++++++ fuzzers/007-timing/timfuz_solve.py | 24 +----------------------- fuzzers/007-timing/timing_txt2csv.py | 5 ++--- 10 files changed, 34 insertions(+), 79 deletions(-) diff --git a/fuzzers/007-timing/checksub.py b/fuzzers/007-timing/checksub.py index 977d5b6f..5387eaf1 100644 --- a/fuzzers/007-timing/checksub.py +++ b/fuzzers/007-timing/checksub.py @@ -58,10 +58,9 @@ def pds(Ads, s): def run(fns_in, sub_json=None, verbose=False): - # arbitrary...data is thrown away - corner = "slow_max" - - Ads, b = loadc_Ads_b(fns_in, corner, ico=True) + assert len(fn_ins) > 0 + # arbitrary corner...data is thrown away + Ads, b = loadc_Ads_b(fns_in, "slow_max", ico=True) if sub_json: print('Subbing JSON %u rows' % len(Ads)) @@ -112,7 +111,7 @@ def main(): parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--sub-json', help='') - parser.add_argument('fns_in', nargs='+', help='timing3.csv input files') + parser.add_argument('fns_in', nargs='*', help='timing3.csv input files') args = parser.parse_args() # Store options in dict to ease passing through functions bench = Benchmark() diff --git a/fuzzers/007-timing/csv_flat2group.py b/fuzzers/007-timing/csv_flat2group.py index 4cdc04fd..a1defef2 100644 --- a/fuzzers/007-timing/csv_flat2group.py +++ b/fuzzers/007-timing/csv_flat2group.py @@ -50,11 +50,15 @@ def main(): # Store options in dict to ease passing through functions bench = Benchmark() + fns_in = args.fns_in + if not fns_in: + fns_in = glob.glob('specimen_*/timing3.csv') + sub_json = load_sub(args.sub_json) try: run( - args.fns_in, + fns_in, args.out, sub_json=sub_json, strict=args.strict, diff --git a/fuzzers/007-timing/csv_group2flat.py b/fuzzers/007-timing/csv_group2flat.py index 45aacdb1..bba0cc5b 100644 --- a/fuzzers/007-timing/csv_group2flat.py +++ b/fuzzers/007-timing/csv_group2flat.py @@ -1,19 +1,6 @@ #!/usr/bin/env python3 -# https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html -from scipy.optimize import linprog from timfuz import Benchmark, loadc_Ads_bs, load_sub, Ads2bounds, corners2csv, corner_s2i -from timfuz_massage import massage_equations -import numpy as np -import glob -import json -import math -from collections import OrderedDict -from fractions import Fraction -import sys -import datetime -import os -import time def gen_flat(fnin, sub_json, corner=None): diff --git a/fuzzers/007-timing/rref.py b/fuzzers/007-timing/rref.py index 6db813b4..e160768c 100644 --- a/fuzzers/007-timing/rref.py +++ b/fuzzers/007-timing/rref.py @@ -1,8 +1,4 @@ #!/usr/bin/env python3 -''' -Triaging tool to help understand where we need more timing coverage -Finds correlated variables to help make better test cases -''' from timfuz import Benchmark, Ar_di2np, loadc_Ads_b, index_names, A_ds2np, simplify_rows import numpy as np @@ -193,6 +189,7 @@ def state_rref(state, verbose=False): def run(fnout, fn_ins, simplify=False, corner=None, verbose=0): print('Loading data') + assert len(fn_ins) > 0 state = State.load(fn_ins, simplify=simplify, corner=corner) state_rref(state, verbose=verbose) state.print_stats() @@ -217,14 +214,18 
@@ def main(): default='build_speed/speed.json', help='Provides speed index to name translation') parser.add_argument('--out', help='Output sub.json substitution result') - parser.add_argument('fns_in', nargs='+', help='timing3.csv input files') + parser.add_argument('fns_in', nargs='*', help='timing3.csv input files') args = parser.parse_args() bench = Benchmark() + fns_in = args.fns_in + if not fns_in: + fns_in = glob.glob('specimen_*/timing3.csv') + try: run( fnout=args.out, - fn_ins=args.fns_in, + fn_ins=fns_in, simplify=args.simplify, corner=args.corner, verbose=args.verbose) diff --git a/fuzzers/007-timing/solve_leastsq.py b/fuzzers/007-timing/solve_leastsq.py index 5bd1f7b0..d77acd2d 100644 --- a/fuzzers/007-timing/solve_leastsq.py +++ b/fuzzers/007-timing/solve_leastsq.py @@ -1,19 +1,14 @@ #!/usr/bin/env python3 -# https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html -from scipy.optimize import linprog from timfuz import Benchmark, load_sub, corner_s2i, acorner2csv import timfuz import numpy as np -import glob import math -from fractions import Fraction import sys import os import time import timfuz_solve import scipy.optimize as optimize -from scipy.optimize import least_squares def mkestimate(Anp, b): @@ -141,7 +136,7 @@ def run_corner( x0 = mkestimate(Anp, b) print('Solving') - res = least_squares(func, x0, bounds=(0, float('inf'))) + res = optimize.least_squares(func, x0, bounds=(0, float('inf'))) print('Done') if outfn: diff --git a/fuzzers/007-timing/solve_linprog.py b/fuzzers/007-timing/solve_linprog.py index 28f181a6..6a27ac4c 100644 --- a/fuzzers/007-timing/solve_linprog.py +++ b/fuzzers/007-timing/solve_linprog.py @@ -1,7 +1,6 @@ #!/usr/bin/env python3 -# https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html -from scipy.optimize import linprog +import scipy.optimize as optimize from timfuz import Benchmark, load_sub, A_ub_np2d, acorner2csv, corner_s2i import numpy as np import glob @@ -151,8 +150,9 @@ def run_corner( print('') # Now find smallest values for delay constants # Due to input bounds (ex: column limit), some delay elements may get eliminated entirely + # https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html print('Running linprog w/ %d r, %d c (%d name)' % (rows, cols, len(names))) - res = linprog( + res = optimize.linprog( c, A_ub=A_ub, b_ub=b_ub, diff --git a/fuzzers/007-timing/sub2csv.py b/fuzzers/007-timing/sub2csv.py index dfb65227..48322dff 100644 --- a/fuzzers/007-timing/sub2csv.py +++ b/fuzzers/007-timing/sub2csv.py @@ -1,25 +1,7 @@ #!/usr/bin/env python3 -from timfuz import Benchmark, Ar_di2np, loadc_Ads_b, index_names, A_ds2np, simplify_rows -import numpy as np -import glob -import math +from timfuz import Benchmark import json -import sympy -from collections import OrderedDict -from fractions import Fraction - - -def mlcm(xs): - ''' - Find the LCM between elements in a group - ''' - l = xs[0] - for n in xs: - for m in xs: - lthis = lcm(n, m) - l = int(max(lthis, l)) - return ret def write_state(state, fout): diff --git a/fuzzers/007-timing/timfuz_massage.py b/fuzzers/007-timing/timfuz_massage.py index 4871e0f4..cd96d314 100644 --- a/fuzzers/007-timing/timfuz_massage.py +++ b/fuzzers/007-timing/timfuz_massage.py @@ -339,6 +339,16 @@ def massage_equations(Ads, b, verbose=False, corner=None): Subtract equations from each other to generate additional constraints Helps provide additional guidance to solver for realistic delays + Ex: given: + a >= 10 + a 
+ b >= 100 + A valid solution is: + a = 100 + However, a better solution is something like + a = 10 + b = 90 + This creates derived constraints to provide more realistic results + Equation pipeline Some operations may generate new equations Simplify after these to avoid unnecessary overhead on redundant constraints diff --git a/fuzzers/007-timing/timfuz_solve.py b/fuzzers/007-timing/timfuz_solve.py index 4f6446ef..684cf05d 100644 --- a/fuzzers/007-timing/timfuz_solve.py +++ b/fuzzers/007-timing/timfuz_solve.py @@ -1,19 +1,9 @@ #!/usr/bin/env python3 -# https://docs.scipy.org/doc/scipy-0.18.1/reference/generated/scipy.optimize.linprog.html -from scipy.optimize import linprog -from timfuz import Benchmark, simplify_rows, loadc_Ads_b, index_names, A_ds2np, run_sub_json, print_eqns, Ads2bounds, instances, SimplifiedToZero, allow_zero_eqns +from timfuz import simplify_rows, loadc_Ads_b, index_names, A_ds2np, run_sub_json, print_eqns, Ads2bounds, instances, SimplifiedToZero, allow_zero_eqns from timfuz_massage import massage_equations import numpy as np -import glob -import json -import math -from collections import OrderedDict -from fractions import Fraction import sys -import datetime -import os -import time def check_feasible(A_ub, b_ub): @@ -162,18 +152,6 @@ def run( #print #col_dist(A_ubd, 'final', names) - print('b10', b[0:100]) - ''' - Given: - a >= 10 - a + b >= 100 - A valid solution is: - a = 100 - However, a better solution is something like - a = 10 - b = 90 - This creates derived constraints to provide more realistic results - ''' if massage: try: Ads, b = massage_equations(Ads, b, corner=corner) diff --git a/fuzzers/007-timing/timing_txt2csv.py b/fuzzers/007-timing/timing_txt2csv.py index ebdda26d..3f0e62af 100644 --- a/fuzzers/007-timing/timing_txt2csv.py +++ b/fuzzers/007-timing/timing_txt2csv.py @@ -12,12 +12,11 @@ from collections import OrderedDict # Speed index: some sort of special value SI_NONE = 0xFFFF +# prefix to make easier to track +# models do not overlap between PIPs and WIREs PREFIX_W = 'WIRE_' PREFIX_P = 'PIP_' -#PREFIX_W = '' -#PREFIX_P = '' - def parse_pip(s): # Entries like From b6b9d9a661fc6cddebf924015c536999d1db5f40 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Mon, 17 Sep 2018 15:40:27 -0700 Subject: [PATCH 53/55] misc cleanup Signed-off-by: John McMaster --- fuzzers/007-timing/Makefile | 10 +-- fuzzers/007-timing/README.md | 9 ++- fuzzers/007-timing/checksub.py | 2 +- fuzzers/007-timing/csv_flat2group.py | 2 +- fuzzers/007-timing/csv_group2flat.py | 21 +++--- fuzzers/007-timing/projects/corner.mk | 8 +-- fuzzers/007-timing/projects/project.mk | 20 +++--- fuzzers/007-timing/rref.py | 8 +-- fuzzers/007-timing/solve_leastsq.py | 8 ++- fuzzers/007-timing/solve_linprog.py | 2 +- fuzzers/007-timing/tile_annotate.py | 64 +++++++------------ fuzzers/007-timing/timfuz.py | 40 ++++++++++-- fuzzers/007-timing/timgrid/Makefile | 2 +- .../{tile_combine.py => timgrid_vc2v.py} | 12 +++- fuzzers/007-timing/timing_txt2csv.py | 2 - 15 files changed, 114 insertions(+), 96 deletions(-) rename fuzzers/007-timing/{tile_combine.py => timgrid_vc2v.py} (92%) diff --git a/fuzzers/007-timing/Makefile b/fuzzers/007-timing/Makefile index 40e42a35..5734d78a 100644 --- a/fuzzers/007-timing/Makefile +++ b/fuzzers/007-timing/Makefile @@ -3,13 +3,13 @@ PRJ?=picorv32 PRJN?=8 -all: build/tilea.json +all: build/timgrid-v.json clean: rm -rf build cd speed && $(MAKE) clean cd timgrid && $(MAKE) clean - cd projects && $(MAKE) clean + cd projects/$(PRJ) && $(MAKE) clean 
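The constraint derivation described in the massage_equations docstring above can be sketched in a few lines. This is a toy illustration, not the project's derive_eq_by_row/derive_eq_by_col implementation; rows are treated as equalities with unit coefficients:

    def derive_by_subtraction(eqns):
        '''eqns: list of (variable coefficient dict, measured delay)'''
        derived = []
        for vars1, b1 in eqns:
            for vars2, b2 in eqns:
                # vars1 strictly nested in vars2: subtracting the rows
                # yields a valid equation on the leftover variables
                if set(vars1) < set(vars2):
                    rest = {k: v for k, v in vars2.items() if k not in vars1}
                    derived.append((rest, b2 - b1))
        return derived

    # t0 = 5 and t0 + t1 = 10 yield the derived equation t1 = 5,
    # discouraging the solver from dumping all delay into t0
    print(derive_by_subtraction([({'t0': 1}, 5), ({'t0': 1, 't1': 1}, 10)]))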
 speed/build/speed.json:
 	cd speed && $(MAKE)
 
@@ -17,10 +17,10 @@ speed/build/speed.json:
-timgrid/build/timgrid.json:
+timgrid/build/timgrid-s.json:
 	cd timgrid && $(MAKE)
 
-build/tilea.json: projects/$(PRJ)/build/tilea.json
+build/timgrid-v.json: projects/$(PRJ)/build/timgrid-v.json
 	mkdir -p build
-	cp projects/$(PRJ)/build/tilea.json build/tilea.json
+	cp projects/$(PRJ)/build/timgrid-v.json build/timgrid-v.json
 
-projects/$(PRJ)/build/tilea.json: speed/build/speed.json timgrid/build/timgrid.json
+projects/$(PRJ)/build/timgrid-v.json: speed/build/speed.json timgrid/build/timgrid-s.json
 	cd projects/$(PRJ) && $(MAKE) N=$(PRJN)
diff --git a/fuzzers/007-timing/README.md b/fuzzers/007-timing/README.md
index a7c79eb2..db5a98bc 100644
--- a/fuzzers/007-timing/README.md
+++ b/fuzzers/007-timing/README.md
@@ -13,10 +13,15 @@ Currently this document focuses exclusively on fabric timing delays.
 ## Quick start
 
 ```
-make
+make -j$(nproc)
 ```
 
-This will take a relatively long time (say 45 min) and generate build/tilea.json
+This will take a relatively long time (say 45 min) and generate build/timgrid-v.json.
+You can do a quicker test run (say 3 min) using:
+
+```
+make PRJ=oneblinkw PRJN=1 -j$(nproc)
+```
 
 ## Vivado background
diff --git a/fuzzers/007-timing/checksub.py b/fuzzers/007-timing/checksub.py
index 5387eaf1..86823805 100644
--- a/fuzzers/007-timing/checksub.py
+++ b/fuzzers/007-timing/checksub.py
@@ -58,7 +58,7 @@ def pds(Ads, s):
 
 def run(fns_in, sub_json=None, verbose=False):
-    assert len(fn_ins) > 0
+    assert len(fns_in) > 0
     # arbitrary corner...data is thrown away
     Ads, b = loadc_Ads_b(fns_in, "slow_max", ico=True)
 
diff --git a/fuzzers/007-timing/csv_flat2group.py b/fuzzers/007-timing/csv_flat2group.py
index a1defef2..a0f76f1d 100644
--- a/fuzzers/007-timing/csv_flat2group.py
+++ b/fuzzers/007-timing/csv_flat2group.py
@@ -35,7 +35,7 @@ def main():
     import argparse
 
     parser = argparse.ArgumentParser(
-        description='Substitute .csv to group correlated symbols')
+        description='Substitute .csv to group correlated variables')
     parser.add_argument('--verbose', action='store_true', help='')
     parser.add_argument('--strict', action='store_true', help='')
 
diff --git a/fuzzers/007-timing/csv_group2flat.py b/fuzzers/007-timing/csv_group2flat.py
index bba0cc5b..403b2991 100644
--- a/fuzzers/007-timing/csv_group2flat.py
+++ b/fuzzers/007-timing/csv_group2flat.py
@@ -3,8 +3,8 @@
 from timfuz import Benchmark, loadc_Ads_bs, load_sub, Ads2bounds, corners2csv, corner_s2i
 
 
-def gen_flat(fnin, sub_json, corner=None):
-    Ads, bs = loadc_Ads_bs([fnin], ico=True)
+def gen_flat(fns_in, sub_json, corner=None):
+    Ads, bs = loadc_Ads_bs(fns_in, ico=True)
     bounds = Ads2bounds(Ads, bs)
     zeros = set()
     nonzeros = set()
@@ -49,20 +49,19 @@ def run(fns_in, fnout, sub_json, corner=None, sort=False, verbose=False):
 
     with open(fnout, 'w') as fout:
         fout.write('ico,fast_max fast_min slow_max slow_min,rows...\n')
-        for fnin in fns_in:
-            #for name, corners in sortf(gen_flat(fnin, sub_json)):
-            for name, corners in gen_flat(fnin, sub_json, corner=corner):
-                row_ico = 1
-                items = [str(row_ico), corners2csv(corners)]
-                items.append('%u %s' % (1, name))
-                fout.write(','.join(items) + '\n')
+        #for name, corners in sortf(gen_flat(fnin, sub_json)):
+        for name, corners in gen_flat(fns_in, sub_json, corner=corner):
+            row_ico = 1
+            items = [str(row_ico), corners2csv(corners)]
+            items.append('%u %s' % (1, name))
+            fout.write(','.join(items) + '\n')
 
 
 def main():
     import argparse
 
     parser = argparse.ArgumentParser(
description='Substitute .csv to ungroup correlated variables') parser.add_argument('--verbose', action='store_true', help='') #parser.add_argument('--sort', action='store_true', help='') @@ -75,7 +74,7 @@ def main(): parser.add_argument('--out', default=None, help='output timing delay .csv') parser.add_argument( 'fns_in', - default=None, + nargs='+', help='input timing delay .csv (NOTE: must be single column)') args = parser.parse_args() # Store options in dict to ease passing through functions diff --git a/fuzzers/007-timing/projects/corner.mk b/fuzzers/007-timing/projects/corner.mk index 3ed37050..f332d727 100644 --- a/fuzzers/007-timing/projects/corner.mk +++ b/fuzzers/007-timing/projects/corner.mk @@ -5,7 +5,7 @@ CORNER=slow_max ALLOW_ZERO_EQN?=N BADPRJ_OK?=N -all: build/$(CORNER)/tilea.json +all: build/$(CORNER)/timgrid-s.json run: $(MAKE) clean @@ -37,11 +37,11 @@ build/$(CORNER)/linprog.csv: build/$(CORNER)/leastsq.csv build/grouped.csv build/$(CORNER)/flat.csv: build/$(CORNER)/linprog.csv # Take separated variables and back-annotate them to the original timing variables - python3 $(TIMFUZ_DIR)/csv_group2flat.py --sub-json build/sub.json --corner $(CORNER) --sort --out build/$(CORNER)/flat.csv.tmp build/$(CORNER)/linprog.csv + python3 $(TIMFUZ_DIR)/csv_group2flat.py --sub-json build/sub.json --corner $(CORNER) --out build/$(CORNER)/flat.csv.tmp build/$(CORNER)/linprog.csv mv build/$(CORNER)/flat.csv.tmp build/$(CORNER)/flat.csv -build/$(CORNER)/tilea.json: build/$(CORNER)/flat.csv +build/$(CORNER)/timgrid-s.json: build/$(CORNER)/flat.csv # Final processing # Insert timing delays into actual tile layouts - python3 $(TIMFUZ_DIR)/tile_annotate.py --tile-json $(TIMFUZ_DIR)/timgrid/build/timgrid.json build/$(CORNER)/flat.csv build/$(CORNER)/tilea.json + python3 $(TIMFUZ_DIR)/tile_annotate.py --timgrid-s $(TIMFUZ_DIR)/timgrid/build/timgrid-s.json --out build/$(CORNER)/timgrid-vc.json build/$(CORNER)/flat.csv diff --git a/fuzzers/007-timing/projects/project.mk b/fuzzers/007-timing/projects/project.mk index 7e2b4f1f..dc29c28e 100644 --- a/fuzzers/007-timing/projects/project.mk +++ b/fuzzers/007-timing/projects/project.mk @@ -10,23 +10,19 @@ RREF_CORNER=slow_max ALLOW_ZERO_EQN?=N BADPRJ_OK?=N -TILEA_JSONS=build/fast_max/tilea.json build/fast_min/tilea.json build/slow_max/tilea.json build/slow_min/tilea.json +TIMGRID_VCS=build/fast_max/timgrid-vc.json build/fast_min/timgrid-vc.json build/slow_max/timgrid-vc.json build/slow_min/timgrid-vc.json -all: build/tilea.json +all: build/timgrid-v.json # make build/checksub first -build/fast_max/tilea.json: build/checksub +build/fast_max/timgrid-vc.json: build/checksub $(MAKE) -f $(TIMFUZ_DIR)/projects/corner.mk CORNER=fast_max -build/fast_min/tilea.json: build/checksub +build/fast_min/timgrid-vc.json: build/checksub $(MAKE) -f $(TIMFUZ_DIR)/projects/corner.mk CORNER=fast_min -build/slow_max/tilea.json: build/checksub +build/slow_max/timgrid-vc.json: build/checksub $(MAKE) -f $(TIMFUZ_DIR)/projects/corner.mk CORNER=slow_max -build/slow_min/tilea.json: build/checksub +build/slow_min/timgrid-vc.json: build/checksub $(MAKE) -f $(TIMFUZ_DIR)/projects/corner.mk CORNER=slow_min -fast_max: build/fast_max/tilea.json -fast_min: build/fast_min/tilea.json -slow_max: build/slow_max/tilea.json -slow_min: build/slow_min/tilea.json $(SPECIMENS_OK): bash generate.sh $(subst /OK,,$@) || (if [ "$(BADPRJ_OK)" != 'Y' ] ; then exit 1; fi; exit 0) @@ -76,6 +72,6 @@ build/checksub: build/grouped.csv build/sub.json python3 $(TIMFUZ_DIR)/checksub.py --sub-json build/sub.json 
build/grouped.csv touch build/checksub -build/tilea.json: $(TILEA_JSONS) - python3 $(TIMFUZ_DIR)/tile_combine.py --out build/tilea.json $(TILEA_JSONS) +build/timgrid-v.json: $(TIMGRID_VCS) + python3 $(TIMFUZ_DIR)/timgrid_vc2v.py --out build/timgrid-v.json $(TIMGRID_VCS) diff --git a/fuzzers/007-timing/rref.py b/fuzzers/007-timing/rref.py index e160768c..fedcfef5 100644 --- a/fuzzers/007-timing/rref.py +++ b/fuzzers/007-timing/rref.py @@ -29,7 +29,7 @@ class State(object): # known zero delay elements self.drop_names = set(drop_names) # active names in rows - # includes sub symbols, excludes symbols that have been substituted out + # includes sub variables, excludes variables that have been substituted out self.base_names = set(self.names) self.names = set(self.base_names) # List of variable substitutions @@ -173,10 +173,10 @@ def state_rref(state, verbose=False): rowdsf = row_sym2dsf(rowsym, names) state.subs[group_name] = rowdsf - # Add the new symbol + # Add the new variables state.names.add(group_name) - # Remove substituted symbols - # Note: symbols may appear multiple times + # Remove substituted variables + # Note: variables may appear multiple times state.names.difference_update(set(rowdsf.keys())) pivot_name = names[row_pivot] state.pivots[group_name] = pivot_name diff --git a/fuzzers/007-timing/solve_leastsq.py b/fuzzers/007-timing/solve_leastsq.py index d77acd2d..db22b168 100644 --- a/fuzzers/007-timing/solve_leastsq.py +++ b/fuzzers/007-timing/solve_leastsq.py @@ -160,11 +160,15 @@ def main(): parser.add_argument('--corner', required=True, default="slow_max", help='') parser.add_argument( '--out', default=None, help='output timing delay .json') - parser.add_argument('fns_in', nargs='+', 'timing3.csv input files') + parser.add_argument('fns_in', nargs='+', help='timing3.csv input files') args = parser.parse_args() # Store options in dict to ease passing through functions bench = Benchmark() + fns_in = args.fns_in + if not fns_in: + fns_in = glob.glob('specimen_*/timing3.csv') + sub_json = None if args.sub_json: sub_json = load_sub(args.sub_json) @@ -173,7 +177,7 @@ def main(): timfuz_solve.run( run_corner=run_corner, sub_json=sub_json, - fns_in=args.fns_in, + fns_in=fns_in, corner=args.corner, massage=args.massage, outfn=args.out, diff --git a/fuzzers/007-timing/solve_linprog.py b/fuzzers/007-timing/solve_linprog.py index 6a27ac4c..d22e14d1 100644 --- a/fuzzers/007-timing/solve_linprog.py +++ b/fuzzers/007-timing/solve_linprog.py @@ -216,7 +216,7 @@ def main(): run_corner=run_corner, sub_json=sub_json, sub_csv=args.sub_csv, - fn_in=fn_in, + fns_in=fns_in, corner=args.corner, massage=args.massage, outfn=args.out, diff --git a/fuzzers/007-timing/tile_annotate.py b/fuzzers/007-timing/tile_annotate.py index 7e87f2fa..ffc07a21 100644 --- a/fuzzers/007-timing/tile_annotate.py +++ b/fuzzers/007-timing/tile_annotate.py @@ -9,50 +9,24 @@ import time import json -def run(fnin, fnout, tile_json_fn, verbose=False): +def run(fns_in, fnout, tile_json_fn, verbose=False): # modified in place tilej = json.load(open(tile_json_fn, 'r')) - Ads, bs = loadc_Ads_bs([fnin], ico=True) - bounds = Ads2bounds(Ads, bs) + for fnin in fns_in: + Ads, bs = loadc_Ads_bs([fnin], ico=True) + bounds = Ads2bounds(Ads, bs) - pipn_net = 0 - pipn_solved = [0, 0, 0, 0] - pipn_covered = [0, 0, 0, 0] - wiren_net = 0 - wiren_solved = [0, 0, 0, 0] - wiren_covered = [0, 0, 0, 0] + for tile in tilej['tiles'].values(): + pips = tile['pips'] + for k, v in pips.items(): + pips[k] = bounds.get('PIP_' + v, [None, None, None, None]) 
- for tile in tilej['tiles'].values(): - pips = tile['pips'] - for k, v in pips.items(): - pips[k] = bounds.get('PIP_' + v, [None, None, None, None]) - pipn_net += 1 - for i in range(4): - if pips[k][i]: - pipn_solved[i] += 1 - if pips[k][i] is not None: - pipn_covered[i] += 1 + wires = tile['wires'] + for k, v in wires.items(): + wires[k] = bounds.get('WIRE_' + v, [None, None, None, None]) - wires = tile['wires'] - for k, v in wires.items(): - wires[k] = bounds.get('WIRE_' + v, [None, None, None, None]) - wiren_net += 1 - for i in range(4): - if wires[k][i]: - wiren_solved[i] += 1 - if wires[k][i] is not None: - wiren_covered[i] += 1 - - for corner, corneri in timfuz.corner_s2i.items(): - print('Corner %s' % corner) - print( - ' Pips: %u / %u solved, %u / %u covered' % - (pipn_solved[corneri], pipn_net, pipn_covered[corneri], pipn_net)) - print( - ' Wires: %u / %u solved, %u / %u covered' % ( - wiren_solved[corneri], wiren_net, wiren_covered[corneri], - wiren_net)) + timfuz.tilej_stats(tilej) json.dump( tilej, @@ -68,13 +42,19 @@ def main(): parser = argparse.ArgumentParser( description= 'Substitute timgrid timing model names for real timing values') - parser.add_argument('--tile-json', default='tiles.json', help='') parser.add_argument( - 'fnin', default=None, help='Input flattened timing csv (flat.json)') - parser.add_argument('fnout', default=None, help='output tile .json') + '--timgrid-s', + default='../../timgrid/build/timgrid-s.json', + help='tilegrid timing delay symbolic input (timgrid-s.json)') + parser.add_argument( + '--out', + default='build/timgrid-vc.json', + help='tilegrid timing delay values at corner (timgrid-vc.json)') + parser.add_argument( + 'fn_ins', nargs='+', help='Input flattened timing csv (flat.json)') args = parser.parse_args() - run(args.fnin, args.fnout, args.tile_json, verbose=False) + run(args.fn_ins, args.out, args.timgrid_s, verbose=False) if __name__ == '__main__': diff --git a/fuzzers/007-timing/timfuz.py b/fuzzers/007-timing/timfuz.py index 45569ed2..581de3a0 100644 --- a/fuzzers/007-timing/timfuz.py +++ b/fuzzers/007-timing/timfuz.py @@ -665,20 +665,20 @@ def load_sub(fn): return j -def row_sub_syms(row, sub_json, strict=False, verbose=False): +def row_sub_vars(row, sub_json, strict=False, verbose=False): if 0 and verbose: print("") print(row.items()) - delsyms = 0 + delvars = 0 for k in sub_json['drop_names']: try: del row[k] - delsyms += 1 + delvars += 1 except KeyError: pass if verbose: - print("Deleted %u symbols" % delsyms) + print("Deleted %u variables" % delvars) if verbose: print('Checking pivots') @@ -750,7 +750,7 @@ def run_sub_json(Ads, sub_json, strict=False, verbose=False): print('Row %u w/ %u elements' % (rowi, len(row))) row_orig = dict(row) - row_sub_syms(row, sub_json, strict=strict, verbose=verbose) + row_sub_vars(row, sub_json, strict=strict, verbose=verbose) nrows += 1 if row_orig != row: nsubs += 1 @@ -817,3 +817,33 @@ def corners2csv(bs): assert len(bs) == 4 corners = ["None" if b is None else str(b) for b in bs] return ' '.join(corners) + + +def tilej_stats(tilej): + stats = {} + for etype in ('pips', 'wires'): + tm = stats.setdefault(etype, {}) + tm['net'] = 0 + tm['solved'] = [0, 0, 0, 0] + tm['covered'] = [0, 0, 0, 0] + + for tile in tilej['tiles'].values(): + for etype in ('pips', 'wires'): + pips = tile[etype] + for k, v in pips.items(): + stats[etype]['net'] += 1 + for i in range(4): + if pips[k][i]: + stats[etype]['solved'][i] += 1 + if pips[k][i] is not None: + stats[etype]['covered'][i] += 1 + + for corner, corneri in 
corner_s2i.items():
+        print('Corner %s' % corner)
+        for etype in ('pips', 'wires'):
+            net = stats[etype]['net']
+            solved = stats[etype]['solved'][corneri]
+            covered = stats[etype]['covered'][corneri]
+            print(
+                '  %s: %u / %u solved, %u / %u covered' %
+                (etype, solved, net, covered, net))
diff --git a/fuzzers/007-timing/timgrid/Makefile b/fuzzers/007-timing/timgrid/Makefile
index af0a72da..30458303 100644
--- a/fuzzers/007-timing/timgrid/Makefile
+++ b/fuzzers/007-timing/timgrid/Makefile
@@ -5,7 +5,7 @@ build/timgrid.txt: generate.tcl
 	cd build && vivado -mode batch -source ../generate.tcl
 
-build/timgrid.json: build/timgrid.txt
-	cd build && python3 ../tile_txt2json.py --speed-json ../../speed/build/speed.json timgrid.txt timgrid.json
+build/timgrid-s.json: build/timgrid.txt
+	cd build && python3 ../tile_txt2json.py --speed-json ../../speed/build/speed.json timgrid.txt timgrid-s.json
 
 clean:
 	rm -rf build
diff --git a/fuzzers/007-timing/tile_combine.py b/fuzzers/007-timing/timgrid_vc2v.py
similarity index 92%
rename from fuzzers/007-timing/tile_combine.py
rename to fuzzers/007-timing/timgrid_vc2v.py
index 940d628f..8c188d81 100644
--- a/fuzzers/007-timing/tile_combine.py
+++ b/fuzzers/007-timing/timgrid_vc2v.py
@@ -5,6 +5,7 @@ import os
 import time
 import json
 from collections import OrderedDict
+import timfuz
 
 corner_s2i = OrderedDict(
     [
@@ -77,6 +78,7 @@ def check_corner_minmax(tilej, verbose=False):
     print('Checking for min/max consistency')
     checks = 0
     bad = 0
+
     for tilev in tilej['tiles'].values():
 
         def process_type(etype):
@@ -102,7 +104,10 @@ def check_corner_minmax(tilej, verbose=False):
 
         process_type('pips')
         process_type('wires')
-    print('minmax: %u / %u bad' % (bad, checks))
+
+    print('')
+    print('minmax: %u / %u bad pairs adjusted' % (bad, checks))
+    timfuz.tilej_stats(tilej)
 
 
 def check_corners_minmax(tilej, verbose=False):
@@ -127,8 +132,9 @@ def main():
     parser = argparse.ArgumentParser(
         description='Combine multiple tile corners into one .json file')
 
-    parser.add_argument('--out', required=True, help='Combined .json file')
-    parser.add_argument('fnins', nargs='+', help='Input .json files')
+    parser.add_argument(
+        '--out', required=True, help='Combined timgrid-v.json file')
+    parser.add_argument('fnins', nargs='+', help='Input timgrid-vc.json files')
 
     args = parser.parse_args()
     run(args.fnins, args.out, verbose=False)
diff --git a/fuzzers/007-timing/timing_txt2csv.py b/fuzzers/007-timing/timing_txt2csv.py
index 3f0e62af..0ba2b36d 100644
--- a/fuzzers/007-timing/timing_txt2csv.py
+++ b/fuzzers/007-timing/timing_txt2csv.py
@@ -1,11 +1,9 @@
 #!/usr/bin/env python3
 
 from timfuz import Benchmark, A_di2ds
-import numpy as np
 import glob
 import math
 import json
-import sympy
 import sys
 from collections import OrderedDict
 
From 03ed7a333b033d6b3889e398c29fa6e4bcee49e7 Mon Sep 17 00:00:00 2001
From: John McMaster
Date: Mon, 17 Sep 2018 16:16:55 -0700
Subject: [PATCH 54/55] timfuz: move extra files experiment => minitest since not a fuzzer

Signed-off-by: John McMaster
---
 {experiments => minitests}/timfuz/node_unique.py | 0
 {experiments => minitests}/timfuz/perf_test.py   | 0
 {experiments => minitests}/timfuz/pip_unique.py  | 0
 {experiments => minitests}/timfuz/wire_unique.py | 0
 4 files changed, 0 insertions(+), 0 deletions(-)
 rename {experiments => minitests}/timfuz/node_unique.py (100%)
 rename {experiments => minitests}/timfuz/perf_test.py (100%)
 rename {experiments => minitests}/timfuz/pip_unique.py (100%)
 rename {experiments => minitests}/timfuz/wire_unique.py (100%)

diff --git a/experiments/timfuz/node_unique.py
b/minitests/timfuz/node_unique.py similarity index 100% rename from experiments/timfuz/node_unique.py rename to minitests/timfuz/node_unique.py diff --git a/experiments/timfuz/perf_test.py b/minitests/timfuz/perf_test.py similarity index 100% rename from experiments/timfuz/perf_test.py rename to minitests/timfuz/perf_test.py diff --git a/experiments/timfuz/pip_unique.py b/minitests/timfuz/pip_unique.py similarity index 100% rename from experiments/timfuz/pip_unique.py rename to minitests/timfuz/pip_unique.py diff --git a/experiments/timfuz/wire_unique.py b/minitests/timfuz/wire_unique.py similarity index 100% rename from experiments/timfuz/wire_unique.py rename to minitests/timfuz/wire_unique.py From 863bfc53ef9beea18a6a93bdd5c2e1737c04f483 Mon Sep 17 00:00:00 2001 From: John McMaster Date: Mon, 17 Sep 2018 18:53:04 -0700 Subject: [PATCH 55/55] timfuz: fix minitest formatting issue Signed-off-by: John McMaster --- minitests/timfuz/perf_test.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/minitests/timfuz/perf_test.py b/minitests/timfuz/perf_test.py index 77d0aefe..a857db13 100644 --- a/minitests/timfuz/perf_test.py +++ b/minitests/timfuz/perf_test.py @@ -119,7 +119,8 @@ def run( def main(): import argparse - parser = argparse.ArgumentParser(description='Matrix solving performance tests') + parser = argparse.ArgumentParser( + description='Matrix solving performance tests') parser.add_argument('--verbose', action='store_true', help='') parser.add_argument('--sparse', action='store_true', help='')
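For reference, the linear-programming step that solve_linprog.py drives (touched in patches 50 and 53 above) boils down to a standard scipy call. A self-contained sketch with made-up numbers rather than the fuzzer's real constraint matrices:

    import numpy as np
    from scipy.optimize import linprog

    # Two toy path measurements over delays (t0, t1):
    #   t0 >= 5 and t0 + t1 >= 10
    # linprog solves A_ub @ x <= b_ub, so the >= rows are negated
    A_ub = np.array([[-1.0, 0.0],
                     [-1.0, -1.0]])
    b_ub = np.array([-5.0, -10.0])
    c = np.ones(2)  # minimize t0 + t1 subject to the path lower bounds
    res = linprog(c, A_ub=A_ub, b_ub=b_ub, bounds=(0, None))
    print(res.fun)  # 10.0: minimum total delay; how it splits between t0
                    # and t1 is underdetermined, which is exactly what the
                    # equation massaging/derivation step tries to pin down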