Skip to content
Projects
Groups
Snippets
Help
This project
Loading...
Sign in / Register
Toggle navigation
C
cwe_checker
Overview
Overview
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
fact-depend
cwe_checker
Commits
0359ea16
Unverified
Commit
0359ea16
authored
Nov 10, 2022
by
van den Bosch
Committed by
GitHub
Nov 10, 2022
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
Expression propagation rewrite (#356)
parent
8372c99a
Expand all
Hide whitespace changes
Inline
Side-by-side
Showing
7 changed files
with
250 additions
and
26 deletions
+250
-26
main.rs
src/caller/src/main.rs
+1
-2
mod.rs
...we_checker_lib/src/analysis/expression_propagation/mod.rs
+228
-0
tests.rs
..._checker_lib/src/analysis/expression_propagation/tests.rs
+0
-0
mod.rs
src/cwe_checker_lib/src/analysis/mod.rs
+1
-0
blk.rs
src/cwe_checker_lib/src/intermediate_representation/blk.rs
+18
-9
expression.rs
...checker_lib/src/intermediate_representation/expression.rs
+1
-1
project.rs
...we_checker_lib/src/intermediate_representation/project.rs
+1
-14
No files found.
src/caller/src/main.rs
View file @
0359ea16
...
...
@@ -81,7 +81,7 @@ fn main() {
/// Return `Ok(file_path)` only if `file_path` points to an existing file.
fn
check_file_existence
(
file_path
:
&
str
)
->
Result
<
String
,
String
>
{
if
std
::
fs
::
metadata
(
&
file_path
)
if
std
::
fs
::
metadata
(
file_path
)
.map_err
(|
err
|
format!
(
"{}"
,
err
))
?
.is_file
()
{
...
...
@@ -127,7 +127,6 @@ fn run_with_ghidra(args: &CmdlineArgs) {
// because it uses up huge amounts of RAM and computation time on some binaries.
modules
.retain
(|
module
|
module
.name
!=
"CWE78"
);
}
let
binary_file_path
=
PathBuf
::
from
(
args
.binary
.clone
()
.unwrap
());
let
binary
:
Vec
<
u8
>
=
std
::
fs
::
read
(
&
binary_file_path
)
.unwrap_or_else
(|
_
|
{
panic!
(
...
...
src/cwe_checker_lib/src/analysis/expression_propagation/mod.rs
0 → 100644
View file @
0359ea16
//! This module contains a fixpoint computation for intra-procedual expression propagation
//! and contains a function for inserting such expressions.
use
super
::
fixpoint
::
Computation
;
use
super
::
forward_interprocedural_fixpoint
::
GeneralizedContext
;
use
crate
::
analysis
::
forward_interprocedural_fixpoint
::
create_computation
;
use
crate
::
analysis
::
graph
::
Graph
;
use
crate
::
analysis
::
graph
::
Node
;
use
crate
::
analysis
::
interprocedural_fixpoint_generic
::
NodeValue
;
use
crate
::
intermediate_representation
::
*
;
use
std
::
collections
::
HashMap
;
/// The context struct for the expression propagation fixpoint computation.
///
/// The computation is a intra procedural forward fixpoint calculation
/// that stores at each node the set of registers with their propagated expressions.
/// This expressions can be used for expression propagation among basic blocks.
pub
struct
Context
<
'a
>
{
graph
:
&
'a
Graph
<
'a
>
,
}
impl
<
'a
>
Context
<
'a
>
{
/// Create a new context object for the given project and control flow graph.
pub
fn
new
(
graph
:
&
'a
Graph
)
->
Context
<
'a
>
{
Context
{
graph
}
}
}
impl
<
'a
>
crate
::
analysis
::
forward_interprocedural_fixpoint
::
Context
<
'a
>
for
Context
<
'a
>
{
type
Value
=
HashMap
<
Variable
,
Expression
>
;
fn
get_graph
(
&
self
)
->
&
Graph
<
'a
>
{
self
.graph
}
/// Merges two values by intersecting their variable-expression pairs.
fn
merge
(
&
self
,
value1
:
&
Self
::
Value
,
value2
:
&
Self
::
Value
)
->
Self
::
Value
{
value1
.iter
()
.filter
(|(
var
,
expr
)|
value2
.get
(
var
)
==
Some
(
expr
))
.map
(|(
var
,
expr
)|
(
var
.clone
(),
expr
.clone
()))
.collect
()
}
/// Adds the expression for the assigned variable to the table.
///
/// Invalid pairs are removed and new expressions are supplemented if possible.
fn
update_def
(
&
self
,
value
:
&
Self
::
Value
,
def
:
&
Term
<
Def
>
)
->
Option
<
Self
::
Value
>
{
let
mut
insertable_expressions
=
value
.clone
();
match
&
def
.term
{
Def
::
Assign
{
var
,
value
:
expression
,
}
=>
{
// Extend the considered expression with already known expressions.
let
mut
extended_expression
=
expression
.clone
();
for
input_var
in
expression
.input_vars
()
.into_iter
()
{
if
let
Some
(
expr
)
=
insertable_expressions
.get
(
input_var
)
{
extended_expression
.substitute_input_var
(
input_var
,
expr
)
}
}
insertable_expressions
.insert
(
var
.clone
(),
extended_expression
.clone
());
// Expressions dependent on the assigned variable are no longer insertable.
insertable_expressions
.retain
(|
_input_var
,
input_expr
|
{
!
input_expr
.input_vars
()
.into_iter
()
.any
(|
x
|
x
==
var
)
});
Some
(
insertable_expressions
)
}
Def
::
Load
{
var
,
address
:
_expression
,
}
=>
{
// Expressions dependent on the assigned variable are no longer insertable
insertable_expressions
.retain
(|
_input_var
,
input_expr
|
{
!
input_expr
.input_vars
()
.into_iter
()
.any
(|
x
|
x
==
var
)
});
Some
(
insertable_expressions
)
}
Def
::
Store
{
..
}
=>
Some
(
insertable_expressions
),
}
}
fn
update_call_stub
(
&
self
,
_value_before_call
:
&
Self
::
Value
,
_call
:
&
Term
<
Jmp
>
,
)
->
Option
<
Self
::
Value
>
{
Some
(
HashMap
::
new
())
}
fn
update_jump
(
&
self
,
value
:
&
Self
::
Value
,
_jump
:
&
Term
<
Jmp
>
,
_untaken_conditional
:
Option
<&
Term
<
Jmp
>>
,
_target
:
&
Term
<
Blk
>
,
)
->
Option
<
Self
::
Value
>
{
Some
(
value
.clone
())
}
fn
update_call
(
&
self
,
_value
:
&
Self
::
Value
,
_call
:
&
Term
<
Jmp
>
,
_target
:
&
Node
,
_calling_convention
:
&
Option
<
String
>
,
)
->
Option
<
Self
::
Value
>
{
None
// This propagation is intra-procedural
}
fn
update_return
(
&
self
,
_value
:
Option
<&
Self
::
Value
>
,
_value_before_call
:
Option
<&
Self
::
Value
>
,
_call_term
:
&
Term
<
Jmp
>
,
_return_term
:
&
Term
<
Jmp
>
,
_calling_convention
:
&
Option
<
String
>
,
)
->
Option
<
Self
::
Value
>
{
Some
(
HashMap
::
new
())
// Start with no prior knowledge
}
fn
specialize_conditional
(
&
self
,
value
:
&
Self
::
Value
,
_condition
:
&
Expression
,
_block_before_condition
:
&
Term
<
Blk
>
,
_is_true
:
bool
,
)
->
Option
<
Self
::
Value
>
{
Some
(
value
.clone
())
}
}
/// Performs the fixpoint algorithm and returns the computation.
///
/// Panics, if the computation does not stabilizes.
fn
compute_expression_propagation
<
'a
>
(
graph
:
&
'a
Graph
,
)
->
Computation
<
GeneralizedContext
<
'a
,
Context
<
'a
>>>
{
let
context
=
Context
::
new
(
graph
);
let
mut
computation
=
create_computation
(
context
,
None
);
for
node
in
graph
.node_indices
()
{
if
let
Node
::
BlkStart
(
_blk
,
_sub
)
=
graph
[
node
]
{
// A start in the CFG has no incoming edges in the CFG and
// are mostly due to cases where the control flow graph is incomplete.
// We assume that no expressions are insertable at such starting nodes.
// Additionally, we initialize every function's entrypoint.
if
graph
.neighbors_directed
(
node
,
petgraph
::
Incoming
)
.next
()
.is_none
()
||
graph
[
node
]
.get_sub
()
.term.blocks
.first
()
==
Some
(
graph
[
node
]
.get_block
())
{
computation
.set_node_value
(
node
,
NodeValue
::
Value
(
HashMap
::
new
()));
}
}
}
computation
.compute_with_max_steps
(
100
);
if
!
computation
.has_stabilized
()
{
panic!
(
"Fixpoint for expression propagation did not stabilize."
);
}
computation
}
/// Returns the computed result for every basic block.
///
/// This returns the table of variable-expression pairs that hold at the beginning of the blocks.
fn
extract_results
<
'a
>
(
graph
:
&
Graph
,
computation
:
Computation
<
GeneralizedContext
<
'a
,
Context
<
'a
>>>
,
)
->
HashMap
<
Tid
,
HashMap
<
Variable
,
Expression
>>
{
let
mut
results
=
HashMap
::
new
();
for
node
in
graph
.node_indices
()
{
if
let
Node
::
BlkStart
(
blk
,
_sub
)
=
graph
[
node
]
{
if
let
Some
(
NodeValue
::
Value
(
insertables
))
=
computation
.get_node_value
(
node
)
{
results
.insert
(
blk
.tid
.clone
(),
insertables
.clone
());
}
}
}
results
}
/// Replaces for every basic block all propagated expressions.
///
/// This uses the expression propagation of basic blocks, thus performs intra-basic-block insertion of expressions.
fn
insert_expressions
(
inseratables
:
HashMap
<
Tid
,
HashMap
<
Variable
,
Expression
>>
,
program
:
&
mut
Program
,
)
{
for
sub
in
program
.subs
.values_mut
()
{
for
block
in
sub
.term.blocks
.iter_mut
()
{
block
.propagate_input_expressions
(
inseratables
.get
(
&
block
.tid
)
.cloned
());
}
}
}
/// Merges consecutive assignment expressions for the same variable.
fn
merge_same_var_assignments
(
project
:
&
mut
Project
)
{
for
sub
in
project
.program.term.subs
.values_mut
()
{
for
blk
in
sub
.term.blocks
.iter_mut
()
{
blk
.merge_def_assignments_to_same_var
();
}
}
}
/// Replaces variables by expressions that can be propagated within functions.
///
/// This is performed by a fixpoint computation and might panic, if it does not stabilize.
pub
fn
propagate_input_expression
(
project
:
&
mut
Project
)
{
let
extern_subs
=
project
.program
.term
.extern_symbols
.keys
()
.cloned
()
.collect
();
merge_same_var_assignments
(
project
);
let
graph
=
crate
::
analysis
::
graph
::
get_program_cfg
(
&
project
.program
,
extern_subs
);
let
computation
=
compute_expression_propagation
(
&
graph
);
let
results
=
extract_results
(
&
graph
,
computation
);
insert_expressions
(
results
,
&
mut
project
.program.term
);
}
#[cfg(test)]
mod
tests
;
src/cwe_checker_lib/src/analysis/expression_propagation/tests.rs
0 → 100644
View file @
0359ea16
This diff is collapsed.
Click to expand it.
src/cwe_checker_lib/src/analysis/mod.rs
View file @
0359ea16
...
...
@@ -3,6 +3,7 @@
pub
mod
backward_interprocedural_fixpoint
;
pub
mod
dead_variable_elimination
;
pub
mod
expression_propagation
;
pub
mod
fixpoint
;
pub
mod
forward_interprocedural_fixpoint
;
pub
mod
function_signature
;
...
...
src/cwe_checker_lib/src/intermediate_representation/blk.rs
View file @
0359ea16
use
super
::
*
;
use
crate
::
utils
::
log
::
LogMessage
;
use
std
::{
collections
::
HashSet
,
fmt
};
use
std
::{
collections
::{
HashMap
,
HashSet
},
fmt
,
};
/// A basic block is a sequence of `Def` instructions followed by up to two `Jmp` instructions.
///
...
...
@@ -74,11 +77,17 @@ impl Term<Blk> {
/// Note that substitution is only possible
/// if the input variables of the input expression itself did not change since the definition of said variable.
///
/// The expression propagation
allows the corresponding [`Project` normalization pass](Project::normalize
)
/// to further simplify the generated expressions
/// The expression propagation
is used in [`expression_propagation` normalization pass](crate::analysis::expression_propagation
)
/// to further simplify the generated expressions
using a fixpoint algorithm
/// and allows more dead stores to be removed during [dead variable elimination](crate::analysis::dead_variable_elimination).
pub
fn
propagate_input_expressions
(
&
mut
self
)
{
let
mut
insertable_expressions
=
Vec
::
new
();
pub
fn
propagate_input_expressions
(
&
mut
self
,
apriori_insertable_expressions
:
Option
<
HashMap
<
Variable
,
Expression
>>
,
)
{
let
mut
insertable_expressions
=
HashMap
::
new
();
if
let
Some
(
insertables
)
=
apriori_insertable_expressions
{
insertable_expressions
=
insertables
;
}
for
def
in
self
.term.defs
.iter_mut
()
{
match
&
mut
def
.term
{
Def
::
Assign
{
...
...
@@ -90,13 +99,13 @@ impl Term<Blk> {
expression
.substitute_input_var
(
input_var
,
input_expr
);
}
// expressions dependent on the assigned variable are no longer insertable
insertable_expressions
.retain
(|
(
input_var
,
input_expr
)
|
{
insertable_expressions
.retain
(|
input_var
,
input_expr
|
{
input_var
!=
var
&&
!
input_expr
.input_vars
()
.into_iter
()
.any
(|
x
|
x
==
var
)
});
// If the value of the assigned variable does not depend on the former value of the variable,
// then it is insertable for future expressions.
if
!
expression
.input_vars
()
.into_iter
()
.any
(|
x
|
x
==
var
)
{
insertable_expressions
.
push
((
var
.clone
(),
expression
.clone
()
));
insertable_expressions
.
insert
(
var
.clone
(),
expression
.clone
(
));
}
}
Def
::
Load
{
...
...
@@ -108,7 +117,7 @@ impl Term<Blk> {
expression
.substitute_input_var
(
input_var
,
input_expr
);
}
// expressions dependent on the assigned variable are no longer insertable
insertable_expressions
.retain
(|
(
input_var
,
input_expr
)
|
{
insertable_expressions
.retain
(|
input_var
,
input_expr
|
{
input_var
!=
var
&&
!
input_expr
.input_vars
()
.into_iter
()
.any
(|
x
|
x
==
var
)
});
}
...
...
@@ -269,7 +278,7 @@ mod tests {
},
};
block
.merge_def_assignments_to_same_var
();
block
.propagate_input_expressions
();
block
.propagate_input_expressions
(
None
);
let
result_defs
=
vec!
[
Def
::
assign
(
"tid_1"
,
...
...
src/cwe_checker_lib/src/intermediate_representation/expression.rs
View file @
0359ea16
...
...
@@ -188,7 +188,7 @@ impl Expression {
}
}
/// Substitute every occurence of `input_var` in `self` with the given `replace_with_expression`.
/// Substitute every occur
r
ence of `input_var` in `self` with the given `replace_with_expression`.
pub
fn
substitute_input_var
(
&
mut
self
,
input_var
:
&
Variable
,
...
...
src/cwe_checker_lib/src/intermediate_representation/project.rs
View file @
0359ea16
...
...
@@ -209,19 +209,6 @@ impl Project {
log_messages
}
/// Propagate input expressions along variable assignments.
///
/// The propagation only occurs inside basic blocks
/// but not across basic block boundaries.
fn
propagate_input_expressions
(
&
mut
self
)
{
for
sub
in
self
.program.term.subs
.values_mut
()
{
for
block
in
sub
.term.blocks
.iter_mut
()
{
block
.merge_def_assignments_to_same_var
();
block
.propagate_input_expressions
();
}
}
}
/// Run some normalization passes over the project.
///
/// Passes:
...
...
@@ -239,7 +226,7 @@ impl Project {
let
mut
logs
=
self
.remove_references_to_nonexisting_tids_and_retarget_non_returning_calls
();
make_block_to_sub_mapping_unique
(
self
);
self
.propagate_input_expressions
(
);
crate
::
analysis
::
expression_propagation
::
propagate_input_expression
(
self
);
self
.substitute_trivial_expressions
();
crate
::
analysis
::
dead_variable_elimination
::
remove_dead_var_assignments
(
self
);
propagate_control_flow
(
self
);
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment