diffblue
diff --git a/regression/goto-synthesizer/CMakeLists.txt b/regression/goto-synthesizer/CMakeLists.txt
Lines changed: 1 addition & 2 deletions
diff --git a/regression/goto-synthesizer/Makefile b/regression/goto-synthesizer/Makefile
Lines changed: 3 additions & 3 deletions
diff --git a/regression/goto-synthesizer/chain.sh b/regression/goto-synthesizer/chain.sh
Lines changed: 12 additions & 6 deletions
diff --git a/regression/goto-synthesizer/loop_contracts_synthesis_01/test.desc b/regression/goto-synthesizer/loop_contracts_synthesis_01/test.desc
Lines changed: 1 addition & 1 deletion
diff --git a/regression/goto-synthesizer/loop_contracts_synthesis_02/main.c b/regression/goto-synthesizer/loop_contracts_synthesis_02/main.c
Lines changed: 17 additions & 0 deletions
diff --git a/regression/goto-synthesizer/loop_contracts_synthesis_02/test.desc b/regression/goto-synthesizer/loop_contracts_synthesis_02/test.desc
Lines changed: 11 additions & 0 deletions
diff --git a/regression/goto-synthesizer/loop_contracts_synthesis_03/main.c b/regression/goto-synthesizer/loop_contracts_synthesis_03/main.c
Lines changed: 16 additions & 0 deletions
diff --git a/regression/goto-synthesizer/loop_contracts_synthesis_03/test.desc b/regression/goto-synthesizer/loop_contracts_synthesis_03/test.desc
Lines changed: 12 additions & 0 deletions
diff --git a/regression/goto-synthesizer/loop_contracts_synthesis_04/main.c b/regression/goto-synthesizer/loop_contracts_synthesis_04/main.c
Lines changed: 17 additions & 0 deletions
diff --git a/regression/goto-synthesizer/loop_contracts_synthesis_04/test.desc b/regression/goto-synthesizer/loop_contracts_synthesis_04/test.desc
Lines changed: 11 additions & 0 deletions
diff --git a/src/analyses/dependence_graph.cpp b/src/analyses/dependence_graph.cpp
Lines changed: 49 additions & 0 deletions
diff --git a/src/analyses/dependence_graph.h b/src/analyses/dependence_graph.h
Lines changed: 19 additions & 2 deletions
diff --git a/src/goto-instrument/contracts/contracts.cpp b/src/goto-instrument/contracts/contracts.cpp
Lines changed: 25 additions & 2 deletions
diff --git a/src/goto-instrument/contracts/contracts.h b/src/goto-instrument/contracts/contracts.h
Lines changed: 13 additions & 0 deletions
diff --git a/src/goto-instrument/contracts/utils.cpp b/src/goto-instrument/contracts/utils.cpp
Lines changed: 31 additions & 0 deletions
@@ -12,9 +12,8 @@ else()
   set(gcc_only_string "")
 endif()
 
-
 add_test_pl_tests(
-    "${CMAKE_CURRENT_SOURCE_DIR}/chain.sh $<TARGET_FILE:goto-cc> $<TARGET_FILE:goto-synthesizer> $<TARGET_FILE:cbmc> ${is_windows}"
+  "${CMAKE_CURRENT_SOURCE_DIR}/chain.sh $<TARGET_FILE:goto-cc> $<TARGET_FILE:goto-instrument> $<TARGET_FILE:goto-synthesizer> $<TARGET_FILE:cbmc> ${is_windows}"
 )
 
 ## Enabling these causes a very significant increase in the time taken to run the regressions
 
@@ -14,16 +14,16 @@ else
 endif
 
 test:
-	@../test.pl -e -p -c '../chain.sh $(exe) ../../../src/goto-synthesizer/goto-synthesizer ../../../src/cbmc/cbmc $(is_windows)' -X smt-backend $(GCC_ONLY)
+	@../test.pl -e -p -c '../chain.sh $(exe) ../../../src/goto-instrument/goto-instrument ../../../src/goto-synthesizer/goto-synthesizer ../../../src/cbmc/cbmc $(is_windows)' -X smt-backend $(GCC_ONLY)
 
 test-cprover-smt2:
-	@../test.pl -e -p -c '../chain.sh $(exe) ../../../src/goto-synthesizer/goto-synthesizer "../../../src/cbmc/cbmc --cprover-smt2" $(is_windows)' \
+	@../test.pl -e -p -c '../chain.sh $(exe) ../../../src/goto-instrument/goto-instrument ../../../src/goto-synthesizer/goto-synthesizer "../../../src/cbmc/cbmc --cprover-smt2" $(is_windows)' \
 					  -X broken-smt-backend -X thorough-smt-backend \
 					  -X broken-cprover-smt-backend -X thorough-cprover-smt-backend \
 					  -s cprover-smt2 $(GCC_ONLY)
 
 test-z3:
-	@../test.pl -e -p -c '../chain.sh $(exe) ../../../src/goto-synthesizer/goto-synthesizer "../../../src/cbmc/cbmc --z3" $(is_windows)' \
+	@../test.pl -e -p -c '../chain.sh $(exe) ../../../src/goto-instrument/goto-instrument ../../../src/goto-synthesizer/goto-synthesizer "../../../src/cbmc/cbmc --z3" $(is_windows)' \
 					  -X broken-smt-backend -X thorough-smt-backend \
 					  -X broken-z3-smt-backend -X thorough-z3-smt-backend \
 					  -s z3 $(GCC_ONLY)
 
@@ -3,14 +3,15 @@
 set -e
 
 goto_cc=$1
-goto_synthesizer=$2
-cbmc=$3
-is_windows=$4
+goto_instrument=$2
+goto_synthesizer=$3
+cbmc=$4
+is_windows=$5
 
 name=${*:$#}
 name=${name%.c}
 
-args=${*:5:$#-5}
+args=${*:6:$#-6}
 if [[ "$args" != *" _ "* ]]
 then
   args_inst=$args
@@ -27,7 +28,9 @@ else
 fi
 
 rm -f "${name}-mod.gb"
-$goto_synthesizer ${args_inst} "${name}.gb" "${name}-mod.gb"
+rm -f "${name}-mod-2.gb"
+echo "Running goto-instrument: "
+$goto_instrument ${args_inst} "${name}.gb" "${name}-mod.gb"
 if [ ! -e "${name}-mod.gb" ] ; then
   cp "$name.gb" "${name}-mod.gb"
 elif echo $args_inst | grep -q -- "--dump-c" ; then
@@ -41,4 +44,7 @@ elif echo $args_inst | grep -q -- "--dump-c" ; then
 
   rm "${name}-mod.c"
 fi
-$cbmc "${name}-mod.gb" ${args_cbmc}
+echo "Running goto-synthesizer: "
+$goto_synthesizer "${name}-mod.gb" "${name}-mod-2.gb"
+echo "Running CBMC: "
+$cbmc "${name}-mod-2.gb" ${args_cbmc}
@@ -1,6 +1,6 @@
 CORE
 main.c
-
+--pointer-check
 ^EXIT=0$
 ^SIGNAL=0$
 ^\[main\.\d+\] line 10 Check loop invariant before entry: SUCCESS$
 
@@ -0,0 +1,17 @@
+#define SIZE 80
+
+void main()
+{
+  unsigned len;
+  __CPROVER_assume(len <= SIZE);
+  __CPROVER_assume(len >= 8);
+  char *array = malloc(len);
+  unsigned s = 0;
+
+  for(unsigned i = 0; i < SIZE; ++i)
+  {
+    if(i == len - 1)
+      break;
+    s += array[i];
+  }
+}
@@ -0,0 +1,11 @@
+CORE
+main.c
+--pointer-check
+^EXIT=0$
+^SIGNAL=0$
+^\[main.pointer\_dereference.\d+\] .* SUCCESS$
+^VERIFICATION SUCCESSFUL$
+--
+--
+This test shows that loop invariants using range predicates can be correctly
+synthesized for programs with only pointer checks but no other assertions.
@@ -0,0 +1,16 @@
+#define SIZE 80
+
+void main()
+{
+  unsigned long len;
+  __CPROVER_assume(len <= SIZE);
+  __CPROVER_assume(len >= 8);
+  char *array = malloc(len);
+  const char *end = array + len;
+  unsigned s = 0;
+
+  while(array != end)
+  {
+    s += *array++;
+  }
+}
@@ -0,0 +1,12 @@
+CORE
+main.c
+--pointer-check
+^EXIT=0$
+^SIGNAL=0$
+^\[main.pointer\_dereference.\d+\] .* SUCCESS$
+^VERIFICATION SUCCESSFUL$
+--
+--
+This test shows that loop invariants using range predicates and same-object
+predicates can be correctly synthesized for programs with only pointer
+checks but no other assertions.
@@ -0,0 +1,17 @@
+#define SIZE 80
+
+void main()
+{
+  unsigned long len;
+  __CPROVER_assume(len <= SIZE);
+  __CPROVER_assume(len >= 8);
+  char *array = malloc(len);
+  unsigned long s = 0;
+
+  unsigned long j = 0;
+  for(unsigned long i = 0; i < len; i++)
+  {
+    s += array[j];
+    j++;
+  }
+}
@@ -0,0 +1,11 @@
+CORE
+main.c
+--pointer-check
+^EXIT=0$
+^SIGNAL=0$
+^\[main.pointer\_dereference.\d+\] .* SUCCESS$
+^VERIFICATION SUCCESSFUL$
+--
+--
+This test shows that the loop-invariant synthesizer can enumerate
+strengthening clauses for invariant-not-preserved violations.
@@ -383,6 +383,55 @@ void dependence_grapht::add_dep(
   nodes[n_to].in[n_from].add(kind);
 }
 
+bool dependence_grapht::is_flow_dependent(
+  const goto_programt::const_targett &from,
+  const goto_programt::const_targett &to)
+{
+  std::set<node_indext> visited;
+  const dep_graph_domaint &from_domain = static_cast<const dep_graph_domaint &>(
+    *storage->abstract_state_before(from, *domain_factory));
+  const dep_graph_domaint &to_domain = static_cast<const dep_graph_domaint &>(
+    *storage->abstract_state_before(to, *domain_factory));
+  return is_flow_dependent(from_domain, to_domain, visited);
+}
+
+bool dependence_grapht::is_flow_dependent(
+  const dep_graph_domaint &from,
+  const dep_graph_domaint &to,
+  std::set<node_indext> &visited)
+{
+  // Is `to` control dependent on `from`?
+  for(const auto node : to.get_control_deps())
+  {
+    const auto &node_domain = (*this)[node];
+    if(visited.count(node_domain.get_node_id()))
+      continue;
+
+    visited.insert(node_domain.get_node_id());
+
+    if(
+      from.get_node_id() == node_domain.get_node_id() ||
+      is_flow_dependent(from, node_domain, visited))
+      return true;
+  }
+
+  // Is `to` data dependent on `from`?
+  for(const auto node : to.get_data_deps())
+  {
+    const auto &node_domain = (*this)[node];
+    if(!visited.insert(node_domain.get_node_id()).second)
+      continue;
+
+    if(
+      from.get_node_id() == node_domain.get_node_id() ||
+      is_flow_dependent(from, node_domain, visited))
+    {
+      return true;
+    }
+  }
+  return false;
+}
+
 void dep_graph_domaint::populate_dep_graph(
   dependence_grapht &dep_graph, goto_programt::const_targett this_loc) const
 {
 
@@ -67,6 +67,7 @@ class dep_graph_domaint:public ai_domain_baset
 {
 public:
   typedef grapht<dep_nodet>::node_indext node_indext;
+  typedef std::set<goto_programt::const_targett> depst;
 
   explicit dep_graph_domaint(node_indext id)
     : has_values(false), node_id(id), has_changed(false)
@@ -167,13 +168,20 @@ class dep_graph_domaint:public ai_domain_baset
   void populate_dep_graph(
     dependence_grapht &, goto_programt::const_targett) const;
 
+  const depst &get_control_deps() const
+  {
+    return control_deps;
+  }
+  const depst &get_data_deps() const
+  {
+    return data_deps;
+  }
+
 private:
   tvt has_values;
   node_indext node_id;
   bool has_changed;
 
-  typedef std::set<goto_programt::const_targett> depst;
-
   // Set of locations with control instructions on which the instruction at this
   // location has a control dependency on
   depst control_deps;
@@ -279,7 +287,16 @@ class dependence_grapht:
     return rd;
   }
 
+  /// Decide whether the instruction `to` is flow dependent on `from`.
+  bool is_flow_dependent(
+    const goto_programt::const_targett &from,
+    const goto_programt::const_targett &to);
+
 protected:
+  bool is_flow_dependent(
+    const dep_graph_domaint &from,
+    const dep_graph_domaint &to,
+    std::set<node_indext> &visited);
   friend dep_graph_domain_factoryt;
   friend dep_graph_domaint;
   const namespacet &ns;
 
@@ -59,6 +59,7 @@ void code_contractst::check_apply_loop_contracts(
   const irep_idt &mode)
 {
   const auto loop_head_location = loop_head->source_location();
+  const unsigned loop_number = loop_end->loop_number;
 
   // Vector representing a (possibly multidimensional) decreases clause
   const auto &decreases_clause_exprs = decreases_clause.operands();
@@ -142,7 +143,7 @@ void code_contractst::check_apply_loop_contracts(
   // i.e., the loop guard was satisfied.
   const auto entered_loop =
     new_tmp_symbol(
-      bool_typet(), loop_head_location, mode, symbol_table, "__entered_loop")
+      bool_typet(), loop_head_location, mode, symbol_table, ENTERED_LOOP)
       .symbol_expr();
   pre_loop_head_instrs.add(
     goto_programt::make_decl(entered_loop, loop_head_location));
@@ -173,7 +174,7 @@ void code_contractst::check_apply_loop_contracts(
   // instrumentation of the loop.
   const auto in_base_case =
     new_tmp_symbol(
-      bool_typet(), loop_head_location, mode, symbol_table, "__in_base_case")
+      bool_typet(), loop_head_location, mode, symbol_table, IN_BASE_CASE)
       .symbol_expr();
   pre_loop_head_instrs.add(
     goto_programt::make_decl(in_base_case, loop_head_location));
@@ -440,6 +441,28 @@ void code_contractst::check_apply_loop_contracts(
     loop_end,
     add_pragma_disable_assigns_check(pre_loop_end_instrs));
 
+  // Record original loop number for some instrumented instructions.
+  for(goto_programt::const_targett it_instr =
+        goto_function.body.instructions.begin();
+      it_instr != goto_function.body.instructions.end();
+      it_instr++)
+  {
+    // Don't override original loop numbers.
+    if(original_loop_number_map.count(it_instr) != 0)
+      continue;
+
+    // Store loop number for
+    // ASSIGN ENTERED_LOOP = TRUE
+    if(
+      is_assignment_to_instrumented_variable(it_instr, ENTERED_LOOP) &&
+      it_instr->assign_rhs() == true_exprt())
+      original_loop_number_map[it_instr] = loop_number;
+
+    // Store loop number for loop havoc.
+    if(is_loop_havoc(*it_instr))
+      original_loop_number_map[it_instr] = loop_number;
+  }
+
   // change the back edge into assume(false) or assume(guard)
   loop_end->turn_into_assume();
   loop_end->condition_nonconst() = boolean_negate(loop_end->condition());
 
@@ -122,6 +122,12 @@ class code_contractst
   symbol_tablet &get_symbol_table();
   goto_functionst &get_goto_functions();
 
+  std::unordered_map<goto_programt::const_targett, unsigned, const_target_hash>
+  get_original_loop_number_map() const
+  {
+    return original_loop_number_map;
+  }
+
   namespacet ns;
 
 protected:
@@ -137,6 +143,13 @@ class code_contractst
   /// Name of loops we are going to unwind.
   std::list<std::string> loop_names;
 
+  /// Map from instructions instrumented for loop contracts to their original
+  /// loop numbers. The following instrumented instructions are stored:
+  /// 1. loop-havoc   ---   beginning of transformed loops
+  /// 2. ASSIGN ENTERED_LOOP = TRUE   ---   end of transformed loops
+  std::unordered_map<goto_programt::const_targett, unsigned, const_target_hash>
+    original_loop_number_map;
+
 public:
   /// \brief Enforce contract of a single function
   void enforce_contract(const irep_idt &function);
 
@@ -447,3 +447,34 @@ void generate_history_variables_initialization(
   // Add all the history variable initialization instructions
   program.destructive_append(history);
 }
+
+bool is_transformed_loop_end(const goto_programt::const_targett &target)
+{
+  // The end of a transformed loop is marked by the instruction
+  // ASSIGN entered_loop = true
+  if(!is_assignment_to_instrumented_variable(target, ENTERED_LOOP))
+    return false;
+
+  return target->assign_rhs() == true_exprt();
+}
+
+bool is_assignment_to_instrumented_variable(
+  const goto_programt::const_targett &target,
+  std::string var_name)
+{
+  INVARIANT(
+    var_name == IN_BASE_CASE || var_name == ENTERED_LOOP,
+    "var_name is not of instrumented variables.");
+
+  if(!target->is_assign())
+    return false;
+
+  if(can_cast_expr<symbol_exprt>(target->assign_lhs()))
+  {
+    const auto &lhs = to_symbol_expr(target->assign_lhs());
+    return id2string(lhs.get_identifier()).find("::" + var_name) !=
+           std::string::npos;
+  }
+
+  return false;
+}
Original file line number	Diff line number	Diff line change
`@@ -12,9 +12,8 @@ else()`
`12`	`12`	`set(gcc_only_string "")`
`13`	`13`	`endif()`
`14`	`14`
`15`		`-`
`16`	`15`	`add_test_pl_tests(`
`17`		`- "${CMAKE_CURRENT_SOURCE_DIR}/chain.sh $<TARGET_FILE:goto-cc> $<TARGET_FILE:goto-synthesizer> $<TARGET_FILE:cbmc> ${is_windows}"`
	`16`	`+ "${CMAKE_CURRENT_SOURCE_DIR}/chain.sh $<TARGET_FILE:goto-cc> $<TARGET_FILE:goto-instrument> $<TARGET_FILE:goto-synthesizer> $<TARGET_FILE:cbmc> ${is_windows}"`
`18`	`17`	`)`
`19`	`18`
`20`	`19`	`## Enabling these causes a very significant increase in the time taken to run the regressions`