# Copyright (C) 2020 FireEye, Inc. All Rights Reserved. # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at: [package root]/LICENSE.txt # Unless required by applicable law or agreed to in writing, software distributed under the License # is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and limitations under the License. import textwrap import capa.rules import capa.engine import capa.features.insn import capa.features.common from capa.rules import Scope from capa.features import * from capa.features.insn import * from capa.features.common import * def match(rules, features, va, scope=Scope.FUNCTION): """ use all matching algorithms and verify that they compute the same result. then, return those results to the caller so they can make their asserts. """ features1, matches1 = capa.engine.match(rules, features, va) ruleset = capa.rules.RuleSet(rules) features2, matches2 = ruleset.match(scope, features, va) for feature, locations in features1.items(): assert feature in features2 assert locations == features2[feature] for rulename, results in matches1.items(): assert rulename in matches2 assert len(results) == len(matches2[rulename]) return features1, matches1 def test_match_simple(): rule = textwrap.dedent( """ rule: meta: name: test rule namespace: testns1/testns2 features: - number: 100 """ ) r = capa.rules.Rule.from_yaml(rule) features, matches = match([r], {capa.features.insn.Number(100): {1, 2}}, 0x0) assert "test rule" in matches assert MatchedRule("test rule") in features assert MatchedRule("testns1") in features assert MatchedRule("testns1/testns2") in features def test_match_range_exact(): rule = textwrap.dedent( """ rule: meta: name: test rule features: - count(number(100)): 2 """ ) r = capa.rules.Rule.from_yaml(rule) # just enough matches _, matches = match([r], {capa.features.insn.Number(100): {1, 2}}, 0x0) assert "test rule" in matches # not enough matches _, matches = match([r], {capa.features.insn.Number(100): {1}}, 0x0) assert "test rule" not in matches # too many matches _, matches = match([r], {capa.features.insn.Number(100): {1, 2, 3}}, 0x0) assert "test rule" not in matches def test_match_range_range(): rule = textwrap.dedent( """ rule: meta: name: test rule features: - count(number(100)): (2, 3) """ ) r = capa.rules.Rule.from_yaml(rule) # just enough matches _, matches = match([r], {capa.features.insn.Number(100): {1, 2}}, 0x0) assert "test rule" in matches # enough matches _, matches = match([r], {capa.features.insn.Number(100): {1, 2, 3}}, 0x0) assert "test rule" in matches # not enough matches _, matches = match([r], {capa.features.insn.Number(100): {1}}, 0x0) assert "test rule" not in matches # too many matches _, matches = match([r], {capa.features.insn.Number(100): {1, 2, 3, 4}}, 0x0) assert "test rule" not in matches def test_match_range_exact_zero(): rule = textwrap.dedent( """ rule: meta: name: test rule features: - count(number(100)): 0 """ ) r = capa.rules.Rule.from_yaml(rule) # feature isn't indexed - good. _, matches = match([r], {}, 0x0) assert "test rule" in matches # feature is indexed, but no matches. # i don't think we should ever really have this case, but good to check anyways. _, matches = match([r], {capa.features.insn.Number(100): {}}, 0x0) assert "test rule" in matches # too many matches _, matches = match([r], {capa.features.insn.Number(100): {1}}, 0x0) assert "test rule" not in matches def test_match_range_with_zero(): rule = textwrap.dedent( """ rule: meta: name: test rule features: - count(number(100)): (0, 1) """ ) r = capa.rules.Rule.from_yaml(rule) # ok _, matches = match([r], {}, 0x0) assert "test rule" in matches _, matches = match([r], {capa.features.insn.Number(100): {}}, 0x0) assert "test rule" in matches _, matches = match([r], {capa.features.insn.Number(100): {1}}, 0x0) assert "test rule" in matches # too many matches _, matches = match([r], {capa.features.insn.Number(100): {1, 2}}, 0x0) assert "test rule" not in matches def test_match_adds_matched_rule_feature(): """show that using `match` adds a feature for matched rules.""" rule = textwrap.dedent( """ rule: meta: name: test rule features: - number: 100 """ ) r = capa.rules.Rule.from_yaml(rule) features, _ = match([r], {capa.features.insn.Number(100): {1}}, 0x0) assert capa.features.common.MatchedRule("test rule") in features def test_match_matched_rules(): """show that using `match` adds a feature for matched rules.""" rules = [ capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: test rule1 features: - number: 100 """ ) ), capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: test rule2 features: - match: test rule1 """ ) ), ] features, _ = match( capa.rules.topologically_order_rules(rules), {capa.features.insn.Number(100): {1}}, 0x0, ) assert capa.features.common.MatchedRule("test rule1") in features assert capa.features.common.MatchedRule("test rule2") in features # the ordering of the rules must not matter, # the engine should match rules in an appropriate order. features, _ = match( capa.rules.topologically_order_rules(reversed(rules)), {capa.features.insn.Number(100): {1}}, 0x0, ) assert capa.features.common.MatchedRule("test rule1") in features assert capa.features.common.MatchedRule("test rule2") in features def test_match_namespace(): rules = [ capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: CreateFile API namespace: file/create/CreateFile features: - api: CreateFile """ ) ), capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: WriteFile API namespace: file/write features: - api: WriteFile """ ) ), capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: file-create features: - match: file/create """ ) ), capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: filesystem-any features: - match: file """ ) ), ] features, matches = match( capa.rules.topologically_order_rules(rules), {capa.features.insn.API("CreateFile"): {1}}, 0x0, ) assert "CreateFile API" in matches assert "file-create" in matches assert "filesystem-any" in matches assert capa.features.common.MatchedRule("file") in features assert capa.features.common.MatchedRule("file/create") in features assert capa.features.common.MatchedRule("file/create/CreateFile") in features features, matches = match( capa.rules.topologically_order_rules(rules), {capa.features.insn.API("WriteFile"): {1}}, 0x0, ) assert "WriteFile API" in matches assert "file-create" not in matches assert "filesystem-any" in matches def test_match_substring(): rules = [ capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: test rule features: - and: - substring: abc """ ) ), ] features, _ = match( capa.rules.topologically_order_rules(rules), {capa.features.common.String("aaaa"): {1}}, 0x0, ) assert capa.features.common.MatchedRule("test rule") not in features features, _ = match( capa.rules.topologically_order_rules(rules), {capa.features.common.String("abc"): {1}}, 0x0, ) assert capa.features.common.MatchedRule("test rule") in features features, _ = match( capa.rules.topologically_order_rules(rules), {capa.features.common.String("111abc222"): {1}}, 0x0, ) assert capa.features.common.MatchedRule("test rule") in features features, _ = match( capa.rules.topologically_order_rules(rules), {capa.features.common.String("111abc"): {1}}, 0x0, ) assert capa.features.common.MatchedRule("test rule") in features features, _ = match( capa.rules.topologically_order_rules(rules), {capa.features.common.String("abc222"): {1}}, 0x0, ) assert capa.features.common.MatchedRule("test rule") in features def test_match_regex(): rules = [ capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: test rule features: - and: - string: /.*bbbb.*/ """ ) ), capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: rule with implied wildcards features: - and: - string: /bbbb/ """ ) ), capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: rule with anchor features: - and: - string: /^bbbb/ """ ) ), ] features, _ = match( capa.rules.topologically_order_rules(rules), {capa.features.insn.Number(100): {1}}, 0x0, ) assert capa.features.common.MatchedRule("test rule") not in features features, _ = match( capa.rules.topologically_order_rules(rules), {capa.features.common.String("aaaa"): {1}}, 0x0, ) assert capa.features.common.MatchedRule("test rule") not in features features, _ = match( capa.rules.topologically_order_rules(rules), {capa.features.common.String("aBBBBa"): {1}}, 0x0, ) assert capa.features.common.MatchedRule("test rule") not in features features, _ = match( capa.rules.topologically_order_rules(rules), {capa.features.common.String("abbbba"): {1}}, 0x0, ) assert capa.features.common.MatchedRule("test rule") in features assert capa.features.common.MatchedRule("rule with implied wildcards") in features assert capa.features.common.MatchedRule("rule with anchor") not in features def test_match_regex_ignorecase(): rules = [ capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: test rule features: - and: - string: /.*bbbb.*/i """ ) ), ] features, _ = match( capa.rules.topologically_order_rules(rules), {capa.features.common.String("aBBBBa"): {1}}, 0x0, ) assert capa.features.common.MatchedRule("test rule") in features def test_match_regex_complex(): rules = [ capa.rules.Rule.from_yaml( textwrap.dedent( r""" rule: meta: name: test rule features: - or: - string: /.*HARDWARE\\Key\\key with spaces\\.*/i """ ) ), ] features, _ = match( capa.rules.topologically_order_rules(rules), {capa.features.common.String(r"Hardware\Key\key with spaces\some value"): {1}}, 0x0, ) assert capa.features.common.MatchedRule("test rule") in features def test_match_regex_values_always_string(): rules = [ capa.rules.Rule.from_yaml( textwrap.dedent( """ rule: meta: name: test rule features: - or: - string: /123/ - string: /0x123/ """ ) ), ] features, _ = match( capa.rules.topologically_order_rules(rules), {capa.features.common.String("123"): {1}}, 0x0, ) assert capa.features.common.MatchedRule("test rule") in features features, _ = match( capa.rules.topologically_order_rules(rules), {capa.features.common.String("0x123"): {1}}, 0x0, ) assert capa.features.common.MatchedRule("test rule") in features def test_match_not(): rule = textwrap.dedent( """ rule: meta: name: test rule namespace: testns1/testns2 features: - not: - number: 99 """ ) r = capa.rules.Rule.from_yaml(rule) _, matches = match([r], {capa.features.insn.Number(100): {1, 2}}, 0x0) assert "test rule" in matches def test_match_not_not(): rule = textwrap.dedent( """ rule: meta: name: test rule namespace: testns1/testns2 features: - not: - not: - number: 100 """ ) r = capa.rules.Rule.from_yaml(rule) _, matches = match([r], {capa.features.insn.Number(100): {1, 2}}, 0x0) assert "test rule" in matches def test_match_operand_number(): rule = textwrap.dedent( """ rule: meta: name: test rule features: - and: - operand[0].number: 0x10 """ ) r = capa.rules.Rule.from_yaml(rule) assert capa.features.insn.OperandNumber(0, 0x10) in {capa.features.insn.OperandNumber(0, 0x10)} _, matches = match([r], {capa.features.insn.OperandNumber(0, 0x10): {1, 2}}, 0x0) assert "test rule" in matches # mismatching index _, matches = match([r], {capa.features.insn.OperandNumber(1, 0x10): {1, 2}}, 0x0) assert "test rule" not in matches # mismatching value _, matches = match([r], {capa.features.insn.OperandNumber(0, 0x11): {1, 2}}, 0x0) assert "test rule" not in matches def test_match_operand_offset(): rule = textwrap.dedent( """ rule: meta: name: test rule features: - and: - operand[0].offset: 0x10 """ ) r = capa.rules.Rule.from_yaml(rule) assert capa.features.insn.OperandOffset(0, 0x10) in {capa.features.insn.OperandOffset(0, 0x10)} _, matches = match([r], {capa.features.insn.OperandOffset(0, 0x10): {1, 2}}, 0x0) assert "test rule" in matches # mismatching index _, matches = match([r], {capa.features.insn.OperandOffset(1, 0x10): {1, 2}}, 0x0) assert "test rule" not in matches # mismatching value _, matches = match([r], {capa.features.insn.OperandOffset(0, 0x11): {1, 2}}, 0x0) assert "test rule" not in matches def test_match_property_access(): rule = textwrap.dedent( """ rule: meta: name: test rule features: - and: - property/read: System.IO.FileInfo::Length """ ) r = capa.rules.Rule.from_yaml(rule) assert capa.features.insn.Property("System.IO.FileInfo::Length", capa.features.common.FeatureAccess.READ) in { capa.features.insn.Property("System.IO.FileInfo::Length", capa.features.common.FeatureAccess.READ) } _, matches = match( [r], {capa.features.insn.Property("System.IO.FileInfo::Length", capa.features.common.FeatureAccess.READ): {1, 2}}, 0x0, ) assert "test rule" in matches # mismatching access _, matches = match( [r], {capa.features.insn.Property("System.IO.FileInfo::Length", capa.features.common.FeatureAccess.WRITE): {1, 2}}, 0x0, ) assert "test rule" not in matches # mismatching value _, matches = match( [r], {capa.features.insn.Property("System.IO.FileInfo::Size", capa.features.common.FeatureAccess.READ): {1, 2}}, 0x0, ) assert "test rule" not in matches