diffblue · thomasspriggs · Jul 13, 2023 · Jul 5, 2023 · Jun 7, 2023 · Jun 7, 2023
diff --git a/regression/cbmc-incr-smt2/structs/large_array_of_struct_nondet_index.c b/regression/cbmc-incr-smt2/structs/large_array_of_struct_nondet_index.c
@@ -0,0 +1,18 @@
+#include <assert.h>
+
+#define ARRAY_SIZE 10000
+
+int main()
+{
+  struct my_structt
+  {
+    int eggs;
+    int ham;
+  };
+  struct my_structt struct_array[ARRAY_SIZE];
+  int x;
+  __CPROVER_assume(x > 0 && x < ARRAY_SIZE);
+  struct_array[x].eggs = 3;
+  assert(struct_array[x].eggs + struct_array[x].ham != 10);
+  assert(struct_array[x].eggs + struct_array[x].ham != 11);
+}
diff --git a/regression/cbmc-incr-smt2/structs/large_array_of_struct_nondet_index.desc b/regression/cbmc-incr-smt2/structs/large_array_of_struct_nondet_index.desc
@@ -0,0 +1,18 @@
+CORE
+large_array_of_struct_nondet_index.c
+--trace
+Passing problem to incremental SMT2 solving
+^EXIT=10$
+^SIGNAL=0$
+line 16 assertion struct_array\[x\]\.eggs \+ struct_array\[x\]\.ham != 10\: FAILURE
+line 17 assertion struct_array\[x\]\.eggs \+ struct_array\[x\]\.ham != 11\: FAILURE
+\{\s*\.eggs=\d+,\s*\.ham=7\s*\}
+\{\s*\.eggs=\d+,\s*\.ham=8\s*\}
+x=\d{1,4}\s
+struct_array\[\(signed (long )+int\)x\]\.eggs=3
+--
+--
+This test covers support for examples with large arrays of structs using nondet
+indexes including trace generation. This combination of features is chosen in
+order to avoid array cell sensitivity or struct field sensitivity simplifying
+away the relevant `member_exprt` and `with_exprt` expressions.
diff --git a/regression/cbmc/array-cell-sensitivity9/test.desc b/regression/cbmc/array-cell-sensitivity9/test.desc
@@ -1,4 +1,4 @@
-CORE
+CORE new-smt-backend
 test.c
 --show-vcc
 main::1::array!0@1#2\[\[0\]\]..x =

diff --git a/regression/cbmc/array-cell-sensitivity9/test_execution.desc b/regression/cbmc/array-cell-sensitivity9/test_execution.desc
@@ -1,4 +1,4 @@
-CORE
+CORE new-smt-backend
 test.c
 
 ^VERIFICATION SUCCESSFUL$

diff --git a/regression/cbmc/field-sensitivity-trace-wrong-counterexample-1/test.desc b/regression/cbmc/field-sensitivity-trace-wrong-counterexample-1/test.desc
@@ -1,4 +1,4 @@
-CORE
+CORE new-smt-backend
 test.c
 --trace
 ^EXIT=10$

diff --git a/regression/cbmc/simplify_singleton_interval_7690/test_smt2.desc b/regression/cbmc/simplify_singleton_interval_7690/test_smt2.desc
@@ -1,4 +1,4 @@
-CORE smt-backend
+CORE smt-backend new-smt-backend
 singleton_interval_in_assume_7690.c
 --pointer-check
 ^\[stk_push\.pointer_dereference\.17] line \d+ dereference failure: pointer outside object bounds in stk-\>elems\[\(signed (long|long long) int\)stk-\>top\]: SUCCESS$

@@ -5,18 +5,24 @@
 #include <util/bitvector_expr.h>
 #include <util/bitvector_types.h>
 #include <util/make_unique.h>
+#include <util/namespace.h>
+#include <util/range.h>
+#include <util/simplify_expr.h>
 
 #include <solvers/flattening/boolbv_width.h>
 
+#include <algorithm>
+#include <numeric>
 #include <queue>
 
 struct_encodingt::struct_encodingt(const namespacet &ns)
-  : boolbv_width{util_make_unique<boolbv_widtht>(ns)}
+  : boolbv_width{util_make_unique<boolbv_widtht>(ns)}, ns{ns}
 {
 }
 
 struct_encodingt::struct_encodingt(const struct_encodingt &other)
-  : boolbv_width{util_make_unique<boolbv_widtht>(*other.boolbv_width)}
+  : boolbv_width{util_make_unique<boolbv_widtht>(*other.boolbv_width)},
+    ns{other.ns}
 {
 }
 
@@ -45,6 +51,57 @@
   return type;
 }
 
+/// \brief Extracts the component/field names and new values from a `with_exprt`
+///        which expresses a new struct value where one or more members of a
+///        struct have had their values substituted with new values.
+/// \note  This is implemented using direct access to the operands and other
+///        underlying irept interfaces, because the interface for `with_exprt`
+///        only supports a single `where` / `new_value` pair and does not
+///        support extracting the name from the `where` operand.
+static std::unordered_map<irep_idt, exprt>
+extricate_updates(const with_exprt &struct_expr)
+{
+  std::unordered_map<irep_idt, exprt> pairs;
+  auto current_operand = struct_expr.operands().begin();
+  // Skip the struct being updated in order to begin with the pairs.
+  current_operand++;
+  while(current_operand != struct_expr.operands().end())
+  {
+    INVARIANT(
+      current_operand->id() == ID_member_name,
+      "operand is expected to be the name of a member");
+    auto name = current_operand->find(ID_component_name).id();
+    ++current_operand;
+    INVARIANT(
+      current_operand != struct_expr.operands().end(),
+      "every name is expected to be followed by a paired value");
+    pairs[name] = *current_operand;
+    ++current_operand;
+  }
+  POSTCONDITION(!pairs.empty());
+  return pairs;
+}
+
+static exprt encode(const with_exprt &with, const namespacet &ns)
+{
+  const auto tag_type = type_checked_cast<struct_tag_typet>(with.type());
+  const auto struct_type =
+    type_checked_cast<struct_typet>(ns.follow(with.type()));
+  const auto updates = extricate_updates(with);
+  const auto components =
+    make_range(struct_type.components())
+      .map([&](const struct_union_typet::componentt &component) -> exprt {
+        const auto &update = updates.find(component.get_name());
+        if(update != updates.end())
+          return update->second;
+        else
+          return member_exprt{
+            with.old(), component.get_name(), component.type()};
+      })
+      .collect<exprt::operandst>();
+  return struct_exprt{components, tag_type};
+}
+
 static exprt encode(const struct_exprt &struct_expr)
 {
   INVARIANT(
@@ -55,6 +112,49 @@
   return concatenation_exprt{struct_expr.operands(), struct_expr.type()};
 }
 
+static std::size_t count_trailing_bit_width(
+  const struct_typet &type,
+  const irep_idt name,
+  const boolbv_widtht &boolbv_width)
+{
+  auto member_component_rit = std::find_if(
+    type.components().rbegin(),
+    type.components().rend(),
+    [&](const struct_union_typet::componentt &component) {
+      return component.get_name() == name;
+    });
+  INVARIANT(
+    member_component_rit != type.components().rend(),
+    "Definition of struct type should include named component.");
+  const auto trailing_widths =
+    make_range(type.components().rbegin(), member_component_rit)
+      .map([&](const struct_union_typet::componentt &component) -> std::size_t {
+        return boolbv_width(component.type());
+      });
+  return std::accumulate(
+    trailing_widths.begin(), trailing_widths.end(), std::size_t{0});
+}
+
+/// The member expression selects the value of a field from a struct. The
+/// struct is encoded as a single bitvector where the first field is stored
+/// in the highest bits. The second field is stored in the next highest set of
+/// bits and so on. As offsets are indexed from the lowest bit, any field can be
+/// selected by extracting the range of bits starting from an offset based on
+/// the combined width of the fields which follow the field being selected.
+exprt struct_encodingt::encode_member(const member_exprt &member_expr) const
+{
+  const auto &struct_type = type_checked_cast<struct_typet>(
+    ns.get().follow(member_expr.compound().type()));
+  const std::size_t offset_bits = count_trailing_bit_width(
+    struct_type, member_expr.get_component_name(), *boolbv_width);
+  const auto member_bits_width = (*boolbv_width)(member_expr.type());
+  return extractbits_exprt{
+    member_expr.compound(),
+    offset_bits + member_bits_width - 1,
+    offset_bits,
+    member_expr.type()};
+}
+
 exprt struct_encodingt::encode(exprt expr) const
 {
   std::queue<exprt *> work_queue;
@@ -63,11 +163,46 @@
   {
     exprt &current = *work_queue.front();
     work_queue.pop();
+    // Note that "with" expressions are handled before type encoding in order to
+    // facilitate checking that they are applied to structs rather than arrays.
+    if(const auto with_expr = expr_try_dynamic_cast<with_exprt>(current))
+      if(can_cast_type<struct_tag_typet>(current.type()))
+        current = ::encode(*with_expr, ns);
     current.type() = encode(current.type());
     if(const auto struct_expr = expr_try_dynamic_cast<struct_exprt>(current))
       current = ::encode(*struct_expr);
+    if(const auto member_expr = expr_try_dynamic_cast<member_exprt>(current))
+      current = encode_member(*member_expr);
     for(auto &operand : current.operands())
       work_queue.push(&operand);
   }
   return expr;
 }
+
+exprt struct_encodingt::decode(
+  const exprt &encoded,
+  const struct_tag_typet &original_type) const
+{
+  // The algorithm below works by extracting each of the separate fields from
+  // the combined encoded value using a `member_exprt` which is itself encoded
+  // into a `bit_extract_exprt`. These separated fields can then be combined
+  // using a `struct_exprt`. This is expected to duplicate the input encoded
+  // expression for each of the fields. However for the case where the input
+  // encoded expression is a `constant_exprt`, expression simplification will be
+  // able simplify away the duplicated portions of the constant and the bit
+  // extraction expressions. This yields a clean struct expression where each
+  // field is a separate constant containing the data solely relevant to that
+  // field.
+  INVARIANT(
+    can_cast_type<bv_typet>(encoded.type()),
+    "Structs are expected to be encoded into bit vectors.");
+  const struct_typet definition = ns.get().follow_tag(original_type);
+  exprt::operandst encoded_fields;
+  for(const auto &component : definition.components())
+  {
+    encoded_fields.push_back(typecast_exprt::conditional_cast(
+      encode(member_exprt{typecast_exprt{encoded, original_type}, component}),
+      component.type()));
+  }
+  return simplify_expr(struct_exprt{encoded_fields, original_type}, ns);
+}
@@ -10,6 +10,8 @@
 
 class namespacet;
 class boolbv_widtht;
+class member_exprt;
+class struct_tag_typet;
 
 /// Encodes struct types/values into non-struct expressions/types.
 class struct_encodingt final
@@ -21,9 +23,16 @@ class struct_encodingt final
 
   typet encode(typet type) const;
   exprt encode(exprt expr) const;
+  /// Reconstructs a struct expression of the \p original_type using the data
+  /// from the bit vector \p encoded expression.
+  exprt
+  decode(const exprt &encoded, const struct_tag_typet &original_type) const;
 
 private:
   std::unique_ptr<boolbv_widtht> boolbv_width;
+  std::reference_wrapper<const namespacet> ns;
+
+  exprt encode_member(const member_exprt &member_expr) const;
 };
 
 #endif // CPROVER_SOLVERS_SMT2_INCREMENTAL_STRUCT_ENCODING_H