rulegen3:: more improvements

2025-07-15 23:52:50 +00:00 · 2022-08-17 17:40:12 +02:00 · 2022-08-17 17:40:12 +02:00 · 80c3dfcd34
commit 80c3dfcd34
parent a441ab474f
1 changed files with 128 additions and 63 deletions
--- a/rulegen3.cpp
+++ b/rulegen3.cpp
@ -513,7 +513,19 @@ struct transducer_transitions {
 inline void print(hstream& hs, transducer_transitions* h) { print(hs, "T", index_pointer(h)); }
 inline void print(hstream& hs, const transducer_state& s) { print(hs, "S", tie(s.tstate1, s.tstate2, s.relation)); }

-using transducer = map<transducer_state, transducer_transitions>;
+template<class T> size_t hsh(T t) { return std::hash<T>()(t); }
+
+struct tshash {
+  size_t operator() (const transducer_state& s) const {
+    size_t res = hsh(s.tstate1) ^ (hsh(s.tstate2) << 16);
+    res ^= size_t(s.relation) + 0x9e3779b9 + (res << 6) + (res >> 2);
+    return res;
+    }
+  };
+
+using tpair = pair<const transducer_state, transducer_transitions>;
+
+using transducer = std::unordered_map<transducer_state, transducer_transitions, tshash>;

 transducer autom;
 int comp_step;
@ -546,7 +558,15 @@ tcell* get_move(tcell *c, int dir) {
  return c->cmove(dir);
  }

+struct tuplehash {
+  size_t operator() (const tuple<tcell*, int, int>& tu) const { return hsh(get<0>(tu)) + (hsh(get<1>(tu)) << 8) + (hsh(get<2>(tu)) << 16); }
+  };
+
+std::unordered_map<tuple<tcell*, int, int>, tcell*, tuplehash> rmmemo;
+
 tcell *rev_move2(tcell *t, int dir1, int dir2) {
+  auto& memo = rmmemo[{t, dir1, dir2}];
+  if(memo) return memo;
  if(dir1 != ENDED) t = rev_move(t, dir1);
  if(dir2 != ENDED) {
    t = t->cmove(dir2);
@ -555,7 +575,7 @@ tcell *rev_move2(tcell *t, int dir1, int dir2) {
    }
  twalker tw = t; get_parent_dir(tw);
  if(t->dist && t->parent_dir == MYSTERY) throw rulegen_failure("no parent_dir assigned after rev_move2!");
-  return t;
+  return memo = t;
  }

 vector<int> desc(tcell *t) {
@ -664,10 +684,20 @@ void compose_with(const transducer& tr, const transducer& dir, transducer& resul
    transducer_transitions *ires;
    const transducer_transitions *t1;
    const transducer_transitions *t2;
-    bool operator < (const searcher& s2) const { return tie(ts1, ts2, ts3, tat, fin1, fin2, fin3, ires, t1, t2) < tie(s2.ts1, s2.ts2, s2.ts3, s2.tat, s2.fin1, s2.fin2, s2.fin3, s2.ires, s2.t1, s2.t2); };
+    bool operator == (const searcher& s2) const { return tie(fin1, fin2, fin3, ires, t1, t2) == tie(s2.fin1, s2.fin2, s2.fin3, s2.ires, s2.t1, s2.t2); };
    };

-  set<searcher> in_queue;
+  struct searchhash {
+    size_t operator() (const searcher& s) const {
+      size_t res = size_t(s.fin1+2*s.fin2+4*s.fin3);
+      res ^= size_t(s.ires) + 0x9e3779b9 + (res << 6) + (res >> 2);
+      res ^= size_t(s.t1) + 0x9e3779b9 + (res << 6) + (res >> 2);
+      res ^= size_t(s.t2) + 0x9e3779b9 + (res << 6) + (res >> 2);
+      return res;
+      }
+    };
+
+  std::unordered_set<searcher, searchhash> in_queue;
  vector<searcher> q;
  auto enqueue = [&] (const searcher& s) {
    if(in_queue.count(s)) return;
@ -684,54 +714,68 @@ void compose_with(const transducer& tr, const transducer& dir, transducer& resul
    searcher sch = searcher{ ts.tstate1, ts.tstate1, ts.tstate1, false, false, false, t.at, &(result[ts]), &(tr.at(ts)), &(dir.at(ts)) };
    enqueue(sch);
    }
+  
+  int tdc = 0, tdc2 = 0;

  for(int i=0; i<isize(q); i++) {
    auto sch = q[i];
    if(sch.t1->accepting_directions && sch.t2->accepting_directions)
      sch.ires->accepting_directions = 1;

-    int dirs1 = isize(treestates[sch.ts1].rules);
-    int dirs2 = isize(treestates[sch.ts2].rules);
-    int dirs3 = isize(treestates[sch.ts3].rules);
    searcher next;
-    for(int d1=ENDED; d1<dirs1; d1++) {
-      if(d1 != ENDED && sch.fin1) break;
-      auto r1 = get_abs_rule1(sch.ts1, d1);
-      if(r1 < 0) continue;
-      for(int d2=ENDED; d2<dirs2; d2++) {
-        if(d2 != ENDED && sch.fin2) break;
-        auto r2 = get_abs_rule1(sch.ts2, d2);
-        if(r2 < 0) continue;
-        next.t1 = sch.t1;
-        if(d1 != ENDED || d2 != ENDED) {
-          if(!sch.t1->t.count({d1, d2})) continue;
-          next.t1 = sch.t1->t.at({d1, d2});
-          }
-        for(int d3=ENDED; d3<dirs3; d3++) {
-          if(d3 != ENDED && sch.fin3) break;
-          auto r3 = get_abs_rule1(sch.ts3, d3);
-          if(r3 < 0) continue;
-          next.t2 = sch.t2;
-          if(d2 != ENDED || d3 != ENDED) {
-            if(!sch.t2->t.count({d2, d3})) continue;
-            next.t2 = sch.t2->t.at({d2, d3});
-            }
+    
+    auto try_d3 = [&] (int d1, int d2, int r1, int r2) {
+      tdc++;

-          next.ts1 = r1; next.fin1 = d1 == ENDED;
-          next.ts2 = r2; next.fin2 = d2 == ENDED;
-          next.ts3 = r3; next.fin3 = d3 == ENDED;
-          next.tat = rev_move2(sch.tat, d1, d3);
-          auto nstate_key = transducer_state { next.ts1, next.ts3, next.tat };
+      auto try_done = [&] (int d3, int r3) {
+        tdc2++;
+        next.ts1 = r1; next.fin1 = d1 == ENDED;
+        next.ts2 = r2; next.fin2 = d2 == ENDED;
+        next.ts3 = r3; next.fin3 = d3 == ENDED;
+        next.tat = rev_move2(sch.tat, d1, d3);
+        auto nstate_key = transducer_state { next.ts1, next.ts3, next.tat };

-          next.ires = sch.ires;
-          if(d1 != ENDED || d3 != ENDED)
-            next.ires = sch.ires->t[{d1, d3}] = &(result[nstate_key]);
+        next.ires = sch.ires;
+        if(d1 != ENDED || d3 != ENDED)
+          next.ires = sch.ires->t[{d1, d3}] = &(result[nstate_key]);

-          enqueue(next);
-          }
+        enqueue(next);
+        };
+      
+      if(d2 == ENDED) {
+        next.t2 = sch.t2;
+        try_done(ENDED, sch.ts3);
        }
+      
+      auto p = sch.t2->t.lower_bound({d2, -999});
+      while(p != sch.t2->t.end() && p->first.first == d2) {
+        int d3 = p->first.second;
+        if(sch.fin3 && d3 != ENDED) break; // we can break right away
+        auto r3 = get_abs_rule1(sch.ts3, d3);
+        next.t2 = p->second;
+        try_done(d3, r3);
+        p++;
+        }
+      };
+    
+    next.t1 = sch.t1;
+    try_d3(ENDED, ENDED, sch.ts1, sch.ts2);
+
+    for(auto& p12: sch.t1->t) {
+      int d1 = p12.first.first;
+      int d2 = p12.first.second;
+      if(sch.fin1 && d1 != ENDED) break; /* we can break right away -- no more to find */
+      if(sch.fin2 && d2 != ENDED) continue; /* ... but here we cannot */
+      auto r1 = get_abs_rule1(sch.ts1, d1);
+      auto r2 = get_abs_rule1(sch.ts2, d2);
+
+      next.t1 = p12.second;
+
+      try_d3(d1, d2, r1, r2);
      }
    }
+
+  println(hlog, "composition queue = ", isize(q), " tdc = ", tie(tdc, tdc2));
  }

 void throw_identity_errors(const transducer& id, const vector<int>& cyc) {
@ -1052,11 +1096,14 @@ EX void find_multiple_interpretation() {
  throw rulegen_failure("no multiple interpretation found");
  }

+EX int max_err_iter = 4;
+
 EX void test_transducers() {
  if(flags & w_skip_transducers) return;
  autom.clear();
  int iterations = 0;
  int multiple_interpretations = 0;
+  int err_iter = 0;
  while(true) {
    next_iteration:
    check_timeout();
@ -1067,10 +1114,20 @@ EX void test_transducers() {
    struct searcher {
      int ts;
      vector<transducer_transitions*> pstates;
-      bool operator < (const searcher& s2) const { return tie(ts, pstates) < tie(s2.ts, s2.pstates); }
+      // bool operator < (const searcher& s2) const { return tie(ts, pstates) < tie(s2.ts, s2.pstates); }
+      bool operator == (const searcher& s2) const { return tie(ts, pstates) == tie(s2.ts, s2.pstates); }
      };

-    set<searcher> in_queue;
+    struct searchhash {
+      size_t operator() (const searcher& s) const {
+        size_t res = hsh(s.ts);
+        // https://stackoverflow.com/questions/20511347/a-good-hash-function-for-a-vector
+        for(auto p: s.pstates) res ^= size_t(p) + 0x9e3779b9 + (res << 6) + (res >> 2);
+        return res;
+        }
+      };
+
+    std::unordered_set<searcher, searchhash> in_queue;
    vector<searcher> q;
    vector<int> parent_id;
    vector<int> parent_dir;
@ -1090,7 +1147,8 @@ EX void test_transducers() {
      searcher sch = searcher{ ts.tstate1, { &(autom[ts]) } };
      enqueue(sch, -1, -1);
      }
-    for(int i=0; i<isize(q); i++) {
+
+    auto process = [&] (int i) {
      searcher sch = q[i];

      int dirs = isize(treestates[sch.ts].rules);
@ -1101,25 +1159,26 @@ EX void test_transducers() {
        for(auto v: sch.pstates) if(v->accepting_directions & (1<<dir)) qty++;
        for(auto v: sch.pstates) for(auto& p: v->t) if(p.first.first == ENDED && (p.second->accepting_directions & (1<<dir))) qty++;
        if(qty > 1) {
-
-          vstate vs;
-          vector<int> path1;
-          int at = build_vstate(vs, path1, parent_dir, parent_id, i, [&] (int i) { return q[i].ts; });
-          println(hlog, "after path = ", path1, " got multiple interpretation");
-          for(auto v: sch.pstates) if(v->accepting_directions & (1<<dir)) println(hlog, "state ", v);
-          for(auto v: sch.pstates) for(auto& p: v->t) if(p.first.first == ENDED && (p.second->accepting_directions & (1<<dir))) println(hlog, "state ", v, " after accepting END/", p.first.second);
-          println(hlog, "starting at state: ", q[at].ts, " reached state ", q[i].ts);
-
-          at = i;
-          while(true) {
-            println(hlog, "state ", q[at].ts, " vs ", q[at].pstates, " dir = ", parent_dir[at]);
-            at = parent_id[at];
-            if(at == -1) break;
-            }
-
          multiple_interpretations++;
          // print_transducer(autom);
-          if(!(flags & w_r3_all_errors)) find_multiple_interpretation();
+          if(!(flags & w_r3_all_errors)) {
+            vstate vs;
+            vector<int> path1;
+            int at = build_vstate(vs, path1, parent_dir, parent_id, i, [&] (int i) { return q[i].ts; });
+            println(hlog, "after path = ", path1, " got multiple interpretation");
+            for(auto v: sch.pstates) if(v->accepting_directions & (1<<dir)) println(hlog, "state ", v);
+            for(auto v: sch.pstates) for(auto& p: v->t) if(p.first.first == ENDED && (p.second->accepting_directions & (1<<dir))) println(hlog, "state ", v, " after accepting END/", p.first.second);
+            println(hlog, "starting at state: ", q[at].ts, " reached state ", q[i].ts);
+
+            at = i;
+            while(true) {
+              println(hlog, "state ", q[at].ts, " vs ", q[at].pstates, " dir = ", parent_dir[at]);
+              at = parent_id[at];
+              if(at == -1) break;
+              }
+
+            find_multiple_interpretation();
+            }
          }
        if(qty == 0) {
          vstate vs;
@ -1171,11 +1230,15 @@ EX void test_transducers() {
        next.pstates.resize(ip - next.pstates.begin());
        enqueue(next, i, s);
        }
-      }
+      };
+
+    for(int i=0; i<isize(q); i++) process(i);
    
    if(changes) {
-      println(hlog, "changes = ", changes, " with ", isize(autom), " states");
-      goto next_iteration;
+      println(hlog, "changes = ", changes, " with ", isize(autom), " states, queue size = ", isize(q), ", add = ", isize(important)-impcount, " MI = ", multiple_interpretations);
+      if(isize(important) > impcount || multiple_interpretations) err_iter++;
+      if(err_iter < max_err_iter) goto next_iteration;
+      if(err_iter == max_err_iter) max_err_iter++;
      }

    if((flags & w_r3_all_errors) && isize(important) > impcount) throw rulegen_retry("errors found by transducers");
@ -1185,7 +1248,7 @@ EX void test_transducers() {
      find_multiple_interpretation();
      }

-    println(hlog, "transducers found successfully after ", iterations, " iterations, ", isize(autom), " states checked, queue size = ", isize(q));
+    println(hlog, "transducers found successfully after ", iterations, " iterations, ", isize(autom), " states checked, queue size = ", isize(q), " rmmemo size = ", isize(rmmemo));
    
    vector<vector<transducer>> special(isize(t_origin));
    for(int tid=0; tid<isize(t_origin); tid++) {
@ -1534,6 +1597,8 @@ EX void cleanup3() {
  qroad_for.clear();
  qroad_memo.clear();
  possible_parents.clear();
+  rmmemo.clear();
+  max_err_iter = 4;
  }

 #if CAP_COMMANDLINE