import textwrap import pytest import capa.rules from capa.features.insn import Number, Offset from capa.features import String def test_rule_ctor(): r = capa.rules.Rule("test rule", capa.rules.FUNCTION_SCOPE, Number(1), {}) assert r.evaluate({Number(0): {1}}) == False assert r.evaluate({Number(1): {1}}) == True def test_rule_yaml(): rule = textwrap.dedent( """ rule: meta: name: test rule author: user@domain.com scope: function examples: - foo1234 - bar5678 features: - and: - number: 1 - number: 2 """ ) r = capa.rules.Rule.from_yaml(rule) assert r.evaluate({Number(0): {1}}) == False assert r.evaluate({Number(0): {1}, Number(1): {1}}) == False assert r.evaluate({Number(0): {1}, Number(1): {1}, Number(2): {1}}) == True assert ( r.evaluate({Number(0): {1}, Number(1): {1}, Number(2): {1}, Number(3): {1}}) == True ) def test_rule_yaml_complex(): rule = textwrap.dedent( """ rule: meta: name: test rule features: - or: - and: - number: 1 - number: 2 - or: - number: 3 - 2 or more: - number: 4 - number: 5 - number: 6 """ ) r = capa.rules.Rule.from_yaml(rule) assert ( r.evaluate({Number(5): {1}, Number(6): {1}, Number(7): {1}, Number(8): {1}}) == True ) assert r.evaluate({Number(6): {1}, Number(7): {1}, Number(8): {1}}) == False def test_rule_yaml_descriptions(): rule = textwrap.dedent(''' rule: meta: name: test rule features: - and: - number: 1 = This is the number 1 - string: This program cannot be run in DOS mode. description: MS-DOS stub message - count(number(2 = AF_INET/SOCK_DGRAM)): 2 ''') r = capa.rules.Rule.from_yaml(rule) assert r.evaluate({Number(1): {1}, Number(2): {2, 3}, String('This program cannot be run in DOS mode.'): {4}}) == True def test_rule_yaml_not(): rule = textwrap.dedent( """ rule: meta: name: test rule features: - and: - number: 1 - not: - number: 2 """ ) r = capa.rules.Rule.from_yaml(rule) assert r.evaluate({Number(1): {1}}) == True assert r.evaluate({Number(1): {1}, Number(2): {1}}) == False def test_rule_yaml_count(): rule = textwrap.dedent( """ rule: meta: name: test rule features: - count(number(100)): 1 """ ) r = capa.rules.Rule.from_yaml(rule) assert r.evaluate({Number(100): {}}) == False assert r.evaluate({Number(100): {1}}) == True assert r.evaluate({Number(100): {1, 2}}) == False def test_rule_yaml_count_range(): rule = textwrap.dedent( """ rule: meta: name: test rule features: - count(number(100)): (1, 2) """ ) r = capa.rules.Rule.from_yaml(rule) assert r.evaluate({Number(100): {}}) == False assert r.evaluate({Number(100): {1}}) == True assert r.evaluate({Number(100): {1, 2}}) == True assert r.evaluate({Number(100): {1, 2, 3}}) == False def test_invalid_rule_feature(): with pytest.raises(capa.rules.InvalidRule): capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: test rule features: - foo: true """ ) ) with pytest.raises(capa.rules.InvalidRule): capa.rules.Rule.from_yaml(textwrap.dedent(''' rule: meta: name: test rule scope: file features: - characteristic: nzxor ''')) with pytest.raises(capa.rules.InvalidRule): capa.rules.Rule.from_yaml(textwrap.dedent(''' rule: meta: name: test rule scope: function features: - characteristic: embedded pe ''')) with pytest.raises(capa.rules.InvalidRule): capa.rules.Rule.from_yaml(textwrap.dedent(''' rule: meta: name: test rule scope: basic block features: - characteristic: embedded pe ''')) def test_lib_rules(): rules = capa.rules.RuleSet([ capa.rules.Rule.from_yaml(textwrap.dedent(''' rule: meta: name: a lib rule lib: true features: - api: CreateFileA ''')), capa.rules.Rule.from_yaml(textwrap.dedent(''' rule: meta: name: test rule scope: basic block features: - characteristic(embedded pe): true """ ) ) def test_lib_rules(): rules = capa.rules.RuleSet( [ capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: a lib rule lib: true features: - api: CreateFileA """ ) ), capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: a standard rule lib: false features: - api: CreateFileW """ ) ), ] ) assert len(rules.function_rules) == 1 def test_subscope_rules(): rules = capa.rules.RuleSet([ capa.rules.Rule.from_yaml(textwrap.dedent(''' rule: meta: name: test rule scope: file features: - and: - characteristic: embedded pe - function: - and: - characteristic: nzxor - characteristic: switch ''')) ]) # the file rule scope will have one rules: # - `test rule` assert len(rules.file_rules) == 1 # the function rule scope have one rule: # - the rule on which `test rule` depends assert len(rules.function_rules) == 1 def test_duplicate_rules(): with pytest.raises(capa.rules.InvalidRule): rules = capa.rules.RuleSet( [ capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: rule-name features: - api: CreateFileA """ ) ), capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: rule-name features: - api: CreateFileW """ ) ), ] ) def test_missing_dependency(): with pytest.raises(capa.rules.InvalidRule): rules = capa.rules.RuleSet( [ capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: dependent rule features: - match: missing rule """ ) ), ] ) def test_invalid_rules(): with pytest.raises(capa.rules.InvalidRule): r = capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: test rule features: - characteristic: number(1) ''')) with pytest.raises(capa.rules.InvalidRule): r = capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: test rule features: - characteristic: count(number(100)) ''')) def test_number_symbol(): rule = textwrap.dedent( """ rule: meta: name: test rule features: - and: - number: 1 - number: 0xFFFFFFFF - number: 2 = symbol name - number: 3 = symbol name - number: 4 = symbol name = another name - number: 0x100 = symbol name - number: 0x11 = (FLAG_A | FLAG_B) """ ) r = capa.rules.Rule.from_yaml(rule) children = list(r.statement.get_children()) assert (Number(1) in children) == True assert (Number(0xFFFFFFFF) in children) == True assert (Number(2, "symbol name") in children) == True assert (Number(3, "symbol name") in children) == True assert (Number(4, "symbol name = another name") in children) == True assert (Number(0x100, "symbol name") in children) == True def test_count_number_symbol(): rule = textwrap.dedent( """ rule: meta: name: test rule features: - or: - count(number(2 = symbol name)): 1 - count(number(0x100 = symbol name)): 2 or more - count(number(0x11 = (FLAG_A | FLAG_B))): 2 or more """ ) r = capa.rules.Rule.from_yaml(rule) assert r.evaluate({Number(2): {}}) == False assert r.evaluate({Number(2): {1}}) == True assert r.evaluate({Number(2): {1, 2}}) == False assert r.evaluate({Number(0x100, "symbol name"): {1}}) == False assert r.evaluate({Number(0x100, "symbol name"): {1, 2, 3}}) == True def test_invalid_number(): with pytest.raises(capa.rules.InvalidRule): r = capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: test rule features: - number: "this is a string" """ ) ) with pytest.raises(capa.rules.InvalidRule): r = capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: test rule features: - number: 2= """ ) ) with pytest.raises(capa.rules.InvalidRule): r = capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: test rule features: - number: symbol name = 2 """ ) ) def test_offset_symbol(): rule = textwrap.dedent( """ rule: meta: name: test rule features: - and: - offset: 1 - offset: 2 = symbol name - offset: 3 = symbol name - offset: 4 = symbol name = another name - offset: 0x100 = symbol name """ ) r = capa.rules.Rule.from_yaml(rule) children = list(r.statement.get_children()) assert (Offset(1) in children) == True assert (Offset(2, "symbol name") in children) == True assert (Offset(3, "symbol name") in children) == True assert (Offset(4, "symbol name = another name") in children) == True assert (Offset(0x100, "symbol name") in children) == True def test_count_offset_symbol(): rule = textwrap.dedent( """ rule: meta: name: test rule features: - or: - count(offset(2 = symbol name)): 1 - count(offset(0x100 = symbol name)): 2 or more - count(offset(0x11 = (FLAG_A | FLAG_B))): 2 or more """ ) r = capa.rules.Rule.from_yaml(rule) assert r.evaluate({Offset(2): {}}) == False assert r.evaluate({Offset(2): {1}}) == True assert r.evaluate({Offset(2): {1, 2}}) == False assert r.evaluate({Offset(0x100, "symbol name"): {1}}) == False assert r.evaluate({Offset(0x100, "symbol name"): {1, 2, 3}}) == True def test_invalid_offset(): with pytest.raises(capa.rules.InvalidRule): r = capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: test rule features: - offset: "this is a string" """ ) ) with pytest.raises(capa.rules.InvalidRule): r = capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: test rule features: - offset: 2= """ ) ) with pytest.raises(capa.rules.InvalidRule): r = capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: test rule features: - offset: symbol name = 2 """ ) ) def test_filter_rules(): rules = capa.rules.RuleSet( [ capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: rule 1 author: joe features: - api: CreateFile """ ) ), capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: rule 2 features: - string: joe """ ) ), ] ) rules = rules.filter_rules_by_meta("joe") assert len(rules) == 1 assert "rule 1" in rules.rules def test_filter_rules_dependencies(): rules = capa.rules.RuleSet( [ capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: rule 1 features: - match: rule 2 """ ) ), capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: rule 2 features: - match: rule 3 """ ) ), capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: rule 3 features: - api: CreateFile """ ) ), ] ) rules = rules.filter_rules_by_meta("rule 1") assert len(rules.rules) == 3 assert "rule 1" in rules.rules assert "rule 2" in rules.rules assert "rule 3" in rules.rules def test_filter_rules_missing_dependency(): with pytest.raises(capa.rules.InvalidRule): capa.rules.RuleSet( [ capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: rule 1 author: joe features: - match: rule 2 """ ) ), ] ) def test_rules_namespace_dependencies(): rules = [ capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: rule 1 namespace: ns1/nsA features: - api: CreateFile """ ) ), capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: rule 2 namespace: ns1/nsB features: - api: CreateFile """ ) ), capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: rule 3 features: - match: ns1/nsA """ ) ), capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: rule 4 features: - match: ns1 """ ) ), ] r3 = set( map(lambda r: r.name, capa.rules.get_rules_and_dependencies(rules, "rule 3")) ) assert "rule 1" in r3 assert "rule 2" not in r3 assert "rule 4" not in r3 r4 = set( map(lambda r: r.name, capa.rules.get_rules_and_dependencies(rules, "rule 4")) ) assert "rule 1" in r4 assert "rule 2" in r4 assert "rule 3" not in r4