#!/usr/bin/env python3 from timfuz import simplify_rows, print_eqns, print_eqns_np, sort_equations, col_dist, index_names import numpy as np import math import sys import datetime import os import time import copy from collections import OrderedDict def lte_const(row_ref, row_cmp): '''Return true if all constants are smaller magnitude in row_cmp than row_ref''' #return False for k, vc in row_cmp.items(): vr = row_ref.get(k, None) # Not in reference? if vr is None: return False if vr < vc: return False return True def sub_rows(row_ref, row_cmp): '''Do row_ref - row_cmp''' #ret = {} ret = OrderedDict() ks = set(row_ref.keys()) ks.update(set(row_cmp.keys())) for k in ks: vr = row_ref.get(k, 0) vc = row_cmp.get(k, 0) res = vr - vc if res: ret[k] = res return ret def derive_eq_by_row(Ads, b, verbose=0, col_lim=0, cmp_heuristic=True): ''' Derive equations by subtracting whole rows cmp_heuristic: drop large generated rows since these are unlikely to constrain the solution Given equations like: t0 >= 10 t0 + t1 >= 15 t0 + t1 + t2 >= 17 When I look at these, I think of a solution something like: t0 = 10f t1 = 5 t2 = 2 However, linprog tends to choose solutions like: t0 = 17 t1 = 0 t2 = 0 To this end, add additional constraints by finding equations that are subsets of other equations How to do this in a reasonable time span? Also equations are sparse, which makes this harder to compute ''' assert len(Ads) == len(b), 'Ads, b length mismatch' rows = len(Ads) # Index equations into hash maps so can lookup sparse elements quicker assert len(Ads) == len(b) Ads_ret = copy.copy(Ads) assert len(Ads) == len(Ads_ret) #print('Finding subsets') ltes = 0 b_ret = list(b) sys.stdout.write('Deriving rows (%u) ' % rows) sys.stdout.flush() progress = int(max(1, rows / 100)) b_warns = 0 for row_refi, row_ref in enumerate(Ads): if row_refi % progress == 0: sys.stdout.write('.') sys.stdout.flush() if col_lim and len(row_ref) > col_lim: continue for row_cmpi, row_cmp in enumerate(Ads): if row_refi == row_cmpi or col_lim and len(row_cmp) > col_lim: continue if not lte_const(row_ref, row_cmp): continue ltes += 1 if verbose: print('') print('match') print(' ', row_ref, b[row_refi]) print(' ', row_cmp, b[row_cmpi]) # Reduce row_new = sub_rows(row_ref, row_cmp) # Did this actually significantly reduce the search space? # should be a relatively small number of rows and be significantly smaller than at least one of them def is_smaller_row(): # Keep any generally small rows if len(row_new) <= 8: return True # And anything that reduced at least one row by half # Ex: going from 120 and 100 element rows to a 20 element row return len(row_new) <= len(row_cmp) / 2 or len( row_new) <= len(row_ref) / 2 if cmp_heuristic and not is_smaller_row(): continue b_new = b[row_refi] - b[row_cmpi] # Definitely possible # Maybe filter these out if they occur? if verbose: print(b_new) # Also inverted sign if b_new < 0: if verbose: print("Unexpected b") b_warns += 1 continue if verbose: print('OK') Ads_ret.append(row_new) b_ret.append(b_new) print(' done') #A_ub_ret = A_di2np(Ads2, cols=cols) print( 'Derive row: %d => %d rows using %d lte' % (len(b), len(b_ret), ltes)) print('Dropped %u invalid equations' % b_warns) assert len(Ads_ret) == len(b_ret) return Ads_ret, b_ret def derive_eq_by_col(Ads, b_ub, verbose=0, keep_orig=True): ''' Derive equations by subtracting out all bounded constants (ie "known" columns) XXX: is this now redundant with derive_row? Seems like a degenerate case, although maybe quicker ''' rows = len(Ads) # Index equations with a single constraint knowns = {} sys.stdout.write('Derive col indexing ') sys.stdout.flush() progress = max(1, rows / 100) for row_refi, row_refd in enumerate(Ads): if row_refi % progress == 0: sys.stdout.write('.') sys.stdout.flush() if len(row_refd) == 1: k, v = list(row_refd.items())[0] # assume simplify_equations handles de-duplicating new_b = 1.0 * b_ub[row_refi] / v assert k not in knowns, "Got new %s w/ val %u, old val %u" % ( k, new_b, knowns[k]) knowns[k] = new_b print(' done') #knowns_set = set(knowns.keys()) print('%d constrained' % len(knowns)) ''' Now see what we can do Rows that are already constrained: eliminate TODO: maybe keep these if this would violate their constraint Otherwise eliminate the original row and generate a simplified result now ''' b_ret = [] Ads_ret = [] sys.stdout.write('Derive col main ') sys.stdout.flush() progress = max(1, rows / 100) for row_refi, row_refd in enumerate(Ads): if row_refi % progress == 0: sys.stdout.write('.') sys.stdout.flush() b_ref = b_ub[row_refi] if keep_orig: Ads_ret.append(row_refd) b_ret.append(b_ref) # Reduce as much as possible #row_new = {} row_new = OrderedDict() b_new = b_ref # Copy over single entries if len(row_refd) == 1: row_new = row_refd else: for k, v in row_refd.items(): if k in knowns: # Remove column and take out corresponding delay b_new -= v * knowns[k] # Copy over else: row_new[k] = v # Possibly reduced all usable contants out if len(row_new) == 0: continue # invalid? if b_new < 0: continue if not keep_orig or row_new != row_refd: Ads_ret.append(row_new) b_ret.append(b_new) print(' done') print('Derive col: %d => %d rows' % (len(b_ub), len(b_ret))) return Ads_ret, b_ret # iteratively increasing column limit until all columns are added def massage_equations( Ads, b, verbose=False, corner=None, iter_lim=1, col_lim=100000): #col_lim = 15 ''' Subtract equations from each other to generate additional constraints Helps provide additional guidance to solver for realistic delays Ex: given: a >= 10 a + b >= 100 A valid solution is: a = 100 However, a better solution is something like a = 10 b = 90 This creates derived constraints to provide more realistic results Equation pipeline Some operations may generate new equations Simplify after these to avoid unnecessary overhead on redundant constraints Similarly some operations may eliminate equations, potentially eliminating a column (ie variable) Remove these columns as necessary to speed up solving ''' assert len(Ads) == len(b), 'Ads, b length mismatch' def check_cols(): assert len(index_names(Ads)) == cols def debug(what): check_cols() if 1 or verbose: print('') print_eqns(Ads, b, verbose=verbose, label=what, lim=20) col_dist(Ads, what) #check_feasible_d(Ads, b) # Try to (intelligently) subtract equations to generate additional constraints # This helps avoid putting all delay in a single shared variable dstart = len(b) cols = len(index_names(Ads)) # Each iteration one more column is allowed until all columns are included # (and the system is stable) di = 0 while True: print n_orig = len(b) print('Loop %d, lim %d' % (di + 1, col_lim)) # Meat of the operation Ads, b = derive_eq_by_row(Ads, b, col_lim=col_lim, cmp_heuristic=True) debug("der_rows") # Run another simplify pass since new equations may have overlap with original Ads, b = simplify_rows(Ads, b, corner=corner) print('Derive row: %d => %d equations' % (n_orig, len(b))) debug("der_rows simp") # derive_cols is mostly degenerate case of derive_rows # however, it will sub out single variables a lot faster if there are a lot of them # linear vs above quadratic, might as well keep it in if 1: n_orig2 = len(b) # Meat of the operation Ads, b = derive_eq_by_col(Ads, b) debug("der_cols") # Run another simplify pass since new equations may have overlap with original Ads, b = simplify_rows(Ads, b, corner=corner) print( 'Derive col %d: %d => %d equations' % (di + 1, n_orig2, len(b))) debug("der_cols simp") # Doesn't help computation, but helps debugging Ads, b = sort_equations(Ads, b) debug("loop done") col_dist(Ads, 'derive done iter %d, lim %d' % (di, col_lim), lim=12) rows = len(Ads) di += 1 dend = len(b) # possible that a new equation was generated and taken away, but close enough if n_orig == len(b) and col_lim >= cols or di >= iter_lim: break col_lim += col_lim / 5 print('') print('Derive net: %d => %d' % (dstart, dend)) print('') # Was experimentting to see how much the higher order columns really help # Helps debug readability Ads, b = sort_equations(Ads, b) debug("final (sorted)") print('') print('Massage final: %d => %d rows' % (dstart, dend)) cols_end = len(index_names(Ads)) print('Massage final: %d => %d cols' % (cols, cols_end)) assert cols_end == cols return Ads, b