from z3 import *

/*
 * Return true when the pair (x, y) satisfies
 *     x*x*y + (3+x)*(7+y) == 1337
 * with both operands typed as uint32_t.
 */
bool check(uint32_t x, uint32_t y)
{
    uint32_t cubic = x * x * y;
    uint32_t product = (3 + x) * (7 + y);

    return cubic + product == 1337;
}

# Model both inputs as 32-bit bit vectors, one symbol per C parameter
x = BitVec('x', 32)
y = BitVec('y', 32)

# A fresh solver holding the single equation taken from check()
solver = Solver()
equation = x*x*y + (3+x)*(7+y) == 1337
solver.add(equation)

# Only a satisfiable instance has a model to report
if solver.check() == sat:
    # Fetch one satisfying assignment and print it nicely
    m = solver.model()
    print(f"x = {m[x]}\ny = {m[y]}")

x = 204374014
y = 334463242

/*
 * Validate a license code.
 *
 * The code is accepted when all of the following hold:
 *   - it is exactly 6 characters long,
 *   - every character is in '0'..'9' or 'A'..'Z',
 *   - XOR-ing 'A' with every character yields 'Z'.
 */
bool verify_license(char *code)
{
    /* Reject anything that is not exactly six characters long. */
    if (strlen(code) != 6)
        return false;

    char acc = 'A';
    for (char *p = code; *p != '\0'; ++p)
    {
        bool is_digit = (*p >= '0' && *p <= '9');
        bool is_upper = (*p >= 'A' && *p <= 'Z');

        /* A single character outside both ranges invalidates the code. */
        if (!is_digit && !is_upper)
            return false;

        acc ^= *p;
    }

    return acc == 'Z';
}

# Symbolic license code: six 8-bit bit vectors, one per character
code = [BitVec(f"c{i}", 8) for i in range(6)]

# Initialize the solver
solver = Solver()

# Running XOR, starting from the concrete 8-bit value 'A'
flag = BitVecVal(ord('A'), 8)

for c in code:
    # Each character must be a digit or an upper-case letter
    is_digit = And(c >= ord('0'), c <= ord('9'))
    is_upper = And(c >= ord('A'), c <= ord('Z'))
    solver.add(Or(is_digit, is_upper))

    # Fold the character into the running XOR
    flag = flag ^ c

# After all six characters the XOR has to equal 'Z'
solver.add(flag == ord('Z'))

# Report one valid code if the constraints are satisfiable
if solver.check() == sat:
    m = solver.model()
    # Turn each model value back into its character
    s = ''.join(chr(m[c].as_long()) for c in code)
    print(f"code = {s}")

code = E2JJ4X

# ... run previous code ...
# Pin the first four characters to the prefix "ABCD"
for char_var, fixed in zip(code, "ABCD"):
    solver.add(char_var == ord(fixed))

# Collected solutions, in the order the solver reports them
s = []

# Enumerate models until the constraints become unsatisfiable
while solver.check() == sat:
    m = solver.model()

    # Decode the model into its six-character string and record it
    s.append(''.join(chr(m[c].as_long()) for c in code))

    # Block this exact assignment so that the next check() has to
    # differ in at least one character
    solver.add(Not(And([c == m[c] for c in code])))

# Print the outcome
print(f"{len(s)} valid codes start with ABCD:\n---")
print("\n".join(s))

22 valid codes start with ABCD:
---
ABCDGX
ABCDFY
ABCDRM
ABCDVI
ABCDWH
ABCDOP
ABCDNQ
ABCDJU
ABCDZE
ABCDXG
ABCDHW
ABCDIV
ABCDKT
ABCDLS
ABCDTK
ABCDEZ
ABCDMR
ABCDYF
ABCDQN
ABCDUJ
ABCDPO
ABCDSL

solver.add(exp1 == exp2)
if (solver.check() == sat): # INCORRECT

/*
 * Obfuscated binary operation on two 32-bit unsigned values.
 * The solver run shown later in this document reports it as
 * equivalent to x + y.
 */
uint32_t obf_op1(uint32_t x, uint32_t y)
{
    return (x ^ y) + 2*(x & y);
}

/*
 * Obfuscated binary operation on two 32-bit unsigned values.
 * The solver run shown later in this document reports it as
 * equivalent to x ^ y.
 */
uint32_t obf_op2(uint32_t x, uint32_t y)
{
    return (x | y) - y + (~x & y);
}

def check_semantic_equivalence(exp1, exp2):
    """Return True if the two expressions are equivalent.

    The solver is asked for an assignment under which the expressions
    differ; when no such assignment exists (unsat), they agree on
    every input.
    """
    prover = Solver()
    prover.add(exp1 != exp2)
    verdict = prover.check()
    return verdict == unsat

# Symbolic 32-bit operands shared by every expression below
x, y = BitVecs('x y', 32)

# Candidate plain operations an obfuscated expression may reduce to
basic_operations = [x + y, x - y, x * y, x & y, x | y, x ^ y]

# The two obfuscated expressions under test
obf_op1 = (x ^ y) + 2*(x & y)
obf_op2 = (x | y) - y + (~x & y)

# Report every (basic, obfuscated) pair that is proven equivalent
for op in basic_operations:
    for obf in (obf_op1, obf_op2):
        if check_semantic_equivalence(op, obf):
            print(f"{op} == {obf}")

x + y == (x ^ y) + 2*(x & y)
x ^ y == (x | y) - y + (~x & y)

/*
 * Pick one of x & y, x | y, x ^ y or 0 depending on three conditions
 * evaluated on the 8-bit inputs.
 *
 * Each condition is compared after a cast to uint8_t, so the
 * arithmetic result is reduced to 8 bits before the comparison.
 * According to the solver output shown later in this document, the
 * first two conditions are always false and the third is always true.
 */
uint8_t opaques(uint8_t x, uint8_t y)
{
    uint8_t z;

    /* First condition: both sides are built from (x ^ y) + 2 * (x & y). */
    if ((uint8_t)(151 * (39 * ((x ^ y) + 2 * (x & y)) + 23) + 111) >
        (uint8_t)((x ^ y) + 2 * (x & y)))
    {
        z = x & y;
    }

    /* Second condition: compares an 8-bit expression against 0x17. */
    else if ((uint8_t)(x-y + 2*(~x&y) - (x^y)) == 0x17)
    {
        z = x | y;
    }

    /* Third condition: compares an 8-bit expression against 100. */
    else if (
        (uint8_t)(195 +
                  97*x +
                  159*y +
                  194*~(x | ~y) +
                  159*(x ^ y) +
                  (163 + x + 255*y + 2*~(x | ~y) + 255*(x ^ y))*
                  (232 + 248*x + 8*y + 240*~(x | ~y) + 8*(x ^ y)) - 57) < 100
    )
    {
        z = x ^ y;
    }

    /* Fallback when none of the conditions above holds. */
    else {
        z = 0;
    }

    return z;
}

def check_false_predicate(p):
    """Return True when the predicate `p` is always false.

    `p` is asserted as-is; if the solver finds no satisfying
    assignment (unsat), no input can make the predicate hold.
    """
    probe = Solver()
    probe.add(p)
    outcome = probe.check()
    return outcome == unsat

def check_true_predicate(p):
    """Return True when the predicate `p` is always true.

    The negation of `p` is asserted; if it has no satisfying
    assignment (unsat), no input can make the predicate fail.
    """
    negated = Not(p)  # <-- Not(p)
    probe = Solver()
    probe.add(negated)
    return probe.check() == unsat
        
# Define x, y as bit vectors of size 8 bits (mirrors the uint8_t operands)
x, y = BitVecs('x y', 8)

# Define the conditional statements to check.
# The C code compares values that were cast to uint8_t, i.e. as unsigned
# numbers. On Z3 bit vectors the Python operators < and > are *signed*
# comparisons, so the two ordering predicates use UGT / ULT to keep the
# unsigned semantics of the original program.
predicates = [
    # if ...
    UGT(
        151*(39*((x ^ y) + 2*(x & y)) + 23) + 111,
        (x ^ y) + 2*(x & y)
    ),

    # else if ...
    x-y + 2*(~x&y) - (x^y) == 0x17,

    # else if ...
    ULT(
        195 +
        97*x +
        159*y +
        194*~(x | ~y) +
        159*(x ^ y) +
        (163 + x + 255*y + 2*~(x | ~y) + 255*(x ^ y))*
        (232 + 248*x + 8*y + 240*~(x | ~y) + 8*(x ^ y)) - 57,
        100
    ),
]

# Iterate over all conditional statements
# Check whether they are opaque predicates
for p in predicates:
    if check_false_predicate(p):
        print(f"ALWAYS FALSE\n---\n{p}\n")

    elif check_true_predicate(p):
        print(f"ALWAYS TRUE\n---\n{p}\n")

ALWAYS FALSE
---
151*(39*((x ^ y) + 2*(x & y)) + 23) + 111 >
(x ^ y) + 2*(x & y)

ALWAYS FALSE
---
x - y + 2*(~x & y) - (x ^ y) == 23

ALWAYS TRUE
---
195 +
97*x +
159*y +
194*~(x | ~y) +
159*(x ^ y) +
(163 + x + 255*y + 2*~(x | ~y) + 255*(x ^ y))*
(232 + 248*x + 8*y + 240*~(x | ~y) + 8*(x ^ y)) -
57 <
100

/*
 * Simplified form of opaques(): returns the bitwise XOR of the two
 * 8-bit inputs.
 */
uint8_t deobf_opaques(uint8_t x, uint8_t y)
{
    uint8_t z = x ^ y;
    return z;
}

def opaques(p1, p2, p3):
    """Encode the if / else-if chain of the C function as one Z3 term.

    The branches are built from the innermost outwards with Z3's If()
    construct; the module-level symbols x and y supply the operands.
    """
    third_branch = If(p3, x ^ y, 0)
    second_branch = If(p2, x | y, third_branch)
    return If(p1, x & y, second_branch)

# Symbolic 8-bit operands
x, y = BitVecs('x y', 8)

# The predicate list holds the three branch conditions, in order
p1, p2, p3 = predicates

# Verify that the nested conditional is equivalent to a plain XOR
check_semantic_equivalence(opaques(p1, p2, p3), x ^ y)

True

Operation	Math	Code
AND	$\land$	&
OR	$\lor$	\|
NOT	$\neg$	~
XOR	$\oplus$	^

A gentle introduction to SMT-based program analysis

SAT

SMT

Program analysis with the help of an SMT solver

Input crafting

Model counting

Semantic equivalence

Detect opaque predicates

Encode control-flow

Final notes

References

Training