Skip to content

Commit 65a1161

Browse files
authored
Merge branch 'main' into warn-user-zero-addr
2 parents 7a75500 + 68184ab commit 65a1161

File tree

3 files changed

+69
-40
lines changed

3 files changed

+69
-40
lines changed

CHANGELOG.md

+4
Original file line numberDiff line numberDiff line change
@@ -39,6 +39,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
3939
so we don't get too large buffers as counterexamples
4040
- More symbolic overapproximation for Balance and ExtCodeHash opcodes, fixing
4141
CodeHash SMT representation
42+
- PNeg + PGT/PGEq/PLeq/PLT simplification rules
4243
- We no longer dispatch Props to SMT that can be solved by a simplification
4344
- Allow user to change the verbosity level via `--verb`. For the moment, this is only to
4445
print some warnings related to zero-address dereference and to print `hemv test`'s
@@ -66,6 +67,9 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
6667
fully explore. Printing of issues is also now much more organized
6768
- `hevm test`'s flag ` --verbose` is now `--verb`, which also increases verbosity
6869
for other elements of the system
70+
- Expressions that are commutative are now canonicalized to have the smaller
71+
value on the LHS. This can significantly help with simplifications, automatically
72+
determining when (Eq a b) is true when a==b modulo commutativity
6973

7074
## [0.54.2] - 2024-12-12
7175

src/EVM/Expr.hs

+46-29
Original file line numberDiff line numberDiff line change
@@ -72,16 +72,26 @@ normArgs sym conc l r = case (l, r) of
7272
where
7373
doOp = op2 sym conc
7474

75+
-- Same as `normArgs`, but for commutative operators it orders the arguments canonically
76+
-- This helps in cases when (PEq x1 x2) is comparing x1 and x2 that are equivalent modulo commutativity.
77+
-- In such cases, normArgsOrd will make sure x1 and x2 look the same.
78+
-- NOTE: This is compatible with `Lit` being always on the left, as `Lit` is always
79+
-- less than any other expression
80+
normArgsOrd :: (Expr EWord -> Expr EWord -> Expr EWord) -> (W256 -> W256 -> W256) -> Expr EWord -> Expr EWord -> Expr EWord
81+
normArgsOrd sym conc l r = if l <= r then doOp l r else doOp r l
82+
where
83+
doOp = op2 sym conc
84+
7585
-- Integers
7686

7787
add :: Expr EWord -> Expr EWord -> Expr EWord
78-
add = normArgs Add (+)
88+
add = normArgsOrd Add (+)
7989

8090
sub :: Expr EWord -> Expr EWord -> Expr EWord
8191
sub = op2 Sub (-)
8292

8393
mul :: Expr EWord -> Expr EWord -> Expr EWord
84-
mul = normArgs Mul (*)
94+
mul = normArgsOrd Mul (*)
8595

8696
div :: Expr EWord -> Expr EWord -> Expr EWord
8797
div = op2 Div (\x y -> if y == 0 then 0 else Prelude.div x y)
@@ -156,21 +166,21 @@ sgt = op2 SGT (\x y ->
156166
in if sx > sy then 1 else 0)
157167

158168
eq :: Expr EWord -> Expr EWord -> Expr EWord
159-
eq = normArgs Eq (\x y -> if x == y then 1 else 0)
169+
eq = normArgsOrd Eq (\x y -> if x == y then 1 else 0)
160170

161171
iszero :: Expr EWord -> Expr EWord
162172
iszero = op1 IsZero (\x -> if x == 0 then 1 else 0)
163173

164174
-- Bits
165175

166176
and :: Expr EWord -> Expr EWord -> Expr EWord
167-
and = normArgs And (.&.)
177+
and = normArgsOrd And (.&.)
168178

169179
or :: Expr EWord -> Expr EWord -> Expr EWord
170-
or = normArgs Or (.|.)
180+
or = normArgsOrd Or (.|.)
171181

172182
xor :: Expr EWord -> Expr EWord -> Expr EWord
173-
xor = normArgs Xor Data.Bits.xor
183+
xor = normArgsOrd Xor Data.Bits.xor
174184

175185
not :: Expr EWord -> Expr EWord
176186
not = op1 Not complement
@@ -706,9 +716,9 @@ pattern MappingSlot :: ByteString -> Expr EWord -> Expr EWord
706716
pattern MappingSlot idx key = Keccak (WriteWord (Lit 0) key (ConcreteBuf idx))
707717

708718
-- storage slots for arrays are determined by (keccak(bytes32(id)) + offset)
709-
-- note that `normArgs` puts the Lit as the 2nd argument to `Add`
719+
-- note that `normArgs` puts the Lit as the 1st argument to `Add`
710720
pattern ArraySlotWithOffs :: ByteString -> Expr EWord -> Expr EWord
711-
pattern ArraySlotWithOffs id offset = Add (Keccak (ConcreteBuf id)) offset
721+
pattern ArraySlotWithOffs id offset = Add offset (Keccak (ConcreteBuf id))
712722

713723
-- special pattern to match the 0th element because the `Add` term gets simplified out
714724
pattern ArraySlotZero :: ByteString -> Expr EWord
@@ -1063,9 +1073,6 @@ simplify e = if (mapExpr go e == e)
10631073
-- literal addresses
10641074
go (WAddr (LitAddr a)) = Lit $ into a
10651075

1066-
-- XOR normalization
1067-
go (Xor a b) = EVM.Expr.xor a b
1068-
10691076
-- simple div/mod/add/sub
10701077
go (Div o1@(Lit _) o2@(Lit _)) = EVM.Expr.div o1 o2
10711078
go (SDiv o1@(Lit _) o2@(Lit _)) = EVM.Expr.sdiv o1 o2
@@ -1094,7 +1101,6 @@ simplify e = if (mapExpr go e == e)
10941101
-- Notice: all Add is normalized, hence the 1st argument is
10951102
-- expected to be Lit, if any. Hence `orig` needs to be the
10961103
-- 2nd argument for Add. However, Sub is not normalized
1097-
go (Add (Lit x) (Add (Lit y) orig)) = add (Lit (x+y)) orig
10981104
-- add + sub NOTE: every combination of Sub is needed (2)
10991105
go (Add (Lit x) (Sub (Lit y) orig)) = sub (Lit (x+y)) orig
11001106
go (Add (Lit x) (Sub orig (Lit y))) = add (Lit (x-y)) orig
@@ -1107,18 +1113,33 @@ simplify e = if (mapExpr go e == e)
11071113
go (Sub (Lit x) (Add (Lit y) orig)) = sub (Lit (x-y)) orig
11081114
go (Sub (Add (Lit x) orig) (Lit y) ) = add (Lit (x-y)) orig
11091115

1116+
-- Add+Add / Mul+Mul / Xor+Xor simplifications, taking
1117+
-- advantage of associativity and commutativity
1118+
-- Since Lit is smallest in the ordering, it will always be the first argument
1119+
-- hence these will collect Lits. See `simp-assoc..` tests
1120+
go (Add (Lit a) (Add (Lit b) x)) = add (Lit (a+b)) x
1121+
go (Mul (Lit a) (Mul (Lit b) x)) = mul (Lit (a*b)) x
1122+
go (Xor (Lit a) (Xor (Lit b) x)) = EVM.Expr.xor (Lit (Data.Bits.xor a b)) x
1123+
go (Add a (Add b c)) = add (l !! 0) (add (l !! 1) (l !! 2))
1124+
where l = sort [a, b, c]
1125+
go (Mul a (Mul b c)) = mul (l !! 0) (mul (l !! 1) (l !! 2))
1126+
where l = sort [a, b, c]
1127+
go (Xor a (Xor b c)) = x (l !! 0) (x (l !! 1) (l !! 2))
1128+
where l = sort [a, b, c]
1129+
x = EVM.Expr.xor
1130+
go (Or a (Or b c)) = o (l !! 0) (o (l !! 1) (l !! 2))
1131+
where l = sort [a, b, c]
1132+
o = EVM.Expr.or
1133+
go (And a (And b c)) = an (l !! 0) (an (l !! 1) (l !! 2))
1134+
where l = sort [a, b, c]
1135+
an = EVM.Expr.and
1136+
11101137
-- redundant add / sub
11111138
go (Sub (Add a b) c)
11121139
| a == c = b
11131140
| b == c = a
11141141
| otherwise = sub (add a b) c
11151142

1116-
-- Add is associative. We are doing left-growing trees because LIT is
1117-
-- arranged to the left. This way, they accumulate in all combinations.
1118-
-- See `sim-assoc-add` test cases in test.hs
1119-
go (Add a (Add b c)) = add (add a b) c
1120-
go (Add (Add (Lit a) x) (Lit b)) = add (Lit (a+b)) x
1121-
11221143
-- add / sub identities
11231144
go (Add a b)
11241145
| b == (Lit 0) = a
@@ -1129,6 +1150,9 @@ simplify e = if (mapExpr go e == e)
11291150
| b == (Lit 0) = a
11301151
| otherwise = sub a b
11311152

1153+
-- XOR normalization
1154+
go (Xor a b) = EVM.Expr.xor a b
1155+
11321156
-- SHL / SHR by 0
11331157
go (SHL a v)
11341158
| a == (Lit 0) = v
@@ -1137,12 +1161,6 @@ simplify e = if (mapExpr go e == e)
11371161
| a == (Lit 0) = v
11381162
| otherwise = shr a v
11391163

1140-
-- doubled And
1141-
go o@(And a (And b c))
1142-
| a == c = (And a b)
1143-
| a == b = (And b c)
1144-
| otherwise = o
1145-
11461164
-- Bitwise AND & OR. These MUST preserve bitwise equivalence
11471165
go (And a b)
11481166
| a == b = a
@@ -1182,11 +1200,6 @@ simplify e = if (mapExpr go e == e)
11821200
(Lit 0, _) -> Lit 0
11831201
_ -> EVM.Expr.min a b
11841202

1185-
-- Mul is associative. We are doing left-growing trees because LIT is
1186-
-- arranged to the left. This way, they accumulate in all combinations.
1187-
-- See `sim-assoc-add` test cases in test.hs
1188-
go (Mul a (Mul b c)) = mul (mul a b) c
1189-
go (Mul (Mul (Lit a) x) (Lit b)) = mul (Lit (a*b)) x
11901203

11911204
-- Some trivial mul eliminations
11921205
go (Mul a b) = case (a, b) of
@@ -1268,6 +1281,10 @@ simplifyProp prop =
12681281
-- negations
12691282
go (PNeg (PBool b)) = PBool (Prelude.not b)
12701283
go (PNeg (PNeg a)) = a
1284+
go (PNeg (PGT a b)) = PLEq a b
1285+
go (PNeg (PGEq a b)) = PLT a b
1286+
go (PNeg (PLT a b)) = PGEq a b
1287+
go (PNeg (PLEq a b)) = PGT a b
12711288

12721289
-- Empty buf
12731290
go (PEq (Lit 0) (BufLength k)) = peq k (ConcreteBuf "")

test/test.hs

+19-11
Original file line numberDiff line numberDiff line change
@@ -354,8 +354,7 @@ tests = testGroup "hevm"
354354
let simpExpr = mapExprM Expr.decomposeStorage expr
355355
-- putStrLnM $ T.unpack $ formatExpr (fromJust simpExpr)
356356
assertEqualM "Decompose did not succeed." (isJust simpExpr) True
357-
-- TODO check what's going on here. Likely the "arbitrary write through array" is the reason why we fail
358-
, expectFail $ test "decompose-6-fail" $ do
357+
, test "decompose-6-fail" $ do
359358
Just c <- solcRuntime "MyContract"
360359
[i|
361360
contract MyContract {
@@ -560,11 +559,11 @@ tests = testGroup "hevm"
560559
let simp = Expr.simplifyProp $ PLT (Max (Lit 5) (BufLength (AbstractBuf "txdata"))) (Lit 99)
561560
assertEqualM "max-buflength rules" simp $ PLT (BufLength (AbstractBuf "txdata")) (Lit 99)
562561
, test "simp-assoc-add1" $ do
563-
let simp = Expr.simplify $ Add (Var "a") (Add (Var "b") (Var "c"))
564-
assertEqualM "assoc rules" simp $ Add (Add (Var "a") (Var "b")) (Var "c")
562+
let simp = Expr.simplify $ Add (Add (Var "c") (Var "a")) (Var "b")
563+
assertEqualM "assoc rules" simp $ Add (Var "a") (Add (Var "b") (Var "c"))
565564
, test "simp-assoc-add2" $ do
566-
let simp = Expr.simplify $ Add (Lit 1) (Add (Var "b") (Var "c"))
567-
assertEqualM "assoc rules" simp $ Add (Add (Lit 1) (Var "b")) (Var "c")
565+
let simp = Expr.simplify $ Add (Add (Lit 1) (Var "c")) (Var "b")
566+
assertEqualM "assoc rules" simp $ Add (Lit 1) (Add (Var "b") (Var "c"))
568567
, test "simp-assoc-add3" $ do
569568
let simp = Expr.simplify $ Add (Lit 1) (Add (Lit 2) (Var "c"))
570569
assertEqualM "assoc rules" simp $ Add (Lit 3) (Var "c")
@@ -579,16 +578,22 @@ tests = testGroup "hevm"
579578
assertEqualM "assoc rules" simp $ Lit 10
580579
, test "simp-assoc-add-7" $ do
581580
let simp = Expr.simplify $ Add (Var "a") (Add (Var "b") (Lit 2))
582-
assertEqualM "assoc rules" simp $ Add (Add (Lit 2) (Var "a")) (Var "b")
581+
assertEqualM "assoc rules" simp $ Add (Lit 2) (Add (Var "a") (Var "b"))
583582
, test "simp-assoc-add8" $ do
584583
let simp = Expr.simplify $ Add (Add (Var "a") (Add (Lit 0x2) (Var "b"))) (Add (Var "c") (Add (Lit 0x2) (Var "d")))
585-
assertEqualM "assoc rules" simp $ Add (Add (Add (Add (Lit 0x4) (Var "a")) (Var "b")) (Var "c")) (Var "d")
584+
assertEqualM "assoc rules" simp $ Add (Lit 4) (Add (Var "a") (Add (Var "b") (Add (Var "c") (Var "d"))))
586585
, test "simp-assoc-mul1" $ do
587-
let simp = Expr.simplify $ Mul (Var "a") (Mul (Var "b") (Var "c"))
588-
assertEqualM "assoc rules" simp $ Mul (Mul (Var "a") (Var "b")) (Var "c")
586+
let simp = Expr.simplify $ Mul (Mul (Var "b") (Var "a")) (Var "c")
587+
assertEqualM "assoc rules" simp $ Mul (Var "a") (Mul (Var "b") (Var "c"))
589588
, test "simp-assoc-mul2" $ do
590589
let simp = Expr.simplify $ Mul (Lit 2) (Mul (Var "a") (Lit 3))
591590
assertEqualM "assoc rules" simp $ Mul (Lit 6) (Var "a")
591+
, test "simp-assoc-xor1" $ do
592+
let simp = Expr.simplify $ Xor (Lit 2) (Xor (Var "a") (Lit 3))
593+
assertEqualM "assoc rules" simp $ Xor (Lit 1) (Var "a")
594+
, test "simp-assoc-xor2" $ do
595+
let simp = Expr.simplify $ Xor (Lit 2) (Xor (Var "b") (Xor (Var "a") (Lit 3)))
596+
assertEqualM "assoc rules" simp $ Xor (Lit 1) (Xor (Var "a") (Var "b"))
592597
, test "simp-zero-write-extend-buffer-len" $ do
593598
let
594599
expr = BufLength $ CopySlice (Lit 0) (Lit 0x10) (Lit 0) (AbstractBuf "buffer") (ConcreteBuf "bimm")
@@ -1509,7 +1514,10 @@ tests = testGroup "hevm"
15091514
|]
15101515
let sig = Just (Sig "fun(uint256,uint256)" [AbiUIntType 256, AbiUIntType 256])
15111516
(_, k) <- withDefaultSolver $ \s -> checkAssert s defaultPanicCodes c sig [] defaultVeriOpts
1512-
putStrLnM $ "Ret: " <> (show k)
1517+
let numErrs = sum $ map (fromEnum . isError) k
1518+
assertEqualM "number of errors (i.e. copySlice issues) is 1" 1 numErrs
1519+
let errStrings = mapMaybe EVM.SymExec.getError k
1520+
assertEqualM "All errors are from copyslice" True $ all ("CopySlice" `List.isInfixOf`) errStrings
15131521
,
15141522
test "symbolic-copyslice" $ do
15151523
Just c <- solcRuntime "MyContract"

0 commit comments

Comments
 (0)