
Commit

Merge branch 'master' of github.com:airbnb/streamalert into austin-merger
Austin Byers committed Mar 21, 2018
2 parents 8cb1373 + e6bd483 commit 75633f1
Showing 67 changed files with 2,931 additions and 2,712 deletions.
291 changes: 180 additions & 111 deletions docs/source/rule-testing.rst
@@ -1,30 +1,100 @@
Rule Testing
============

To test the accuracy of new rules, local tests can be written to verify that alerts trigger against valid input.

The ``manage.py`` CLI tool comes built-in with a ``lambda test`` command which does exactly this.

Configuration
~~~~~~~~~~~~~

To test a new rule, first create a new JSON file anywhere within the ``tests/integration/rules`` directory with the ``.json`` extension.

This file should contain the following structure:

.. code-block:: json

  [
    {
      "data": "Either a string, or JSON object",
      "description": "This test should trigger or not trigger an alert",
      "log": "The log name declared in logs.json",
      "service": "The service sending the log - kinesis, s3, sns, or stream_alert_app",
      "source": "The exact resource which sent the log - kinesis stream name, s3 bucket ID, SNS topic name, or StreamAlert App function name",
      "trigger_rules": [
        "list of rule names which should generate alerts",
        "another potential rule name could go here"
      ]
    }
  ]

.. note:: Multiple tests can be included in one file by adding them to the array above.

When specifying the test data, either of two fields can be used:

1. ``"data"``: An entire example record, with all necessary fields to properly classify
2. ``"override_record"``: A subset of the example record, where only relevant fields are populated

The advantage of option #2 is that the overall test event is much smaller.

The testing framework will auto-populate the records behind the scenes with the remaining fields for that given log type.

For example:

.. code-block:: json

  [
    {
      "data": {
        "account": "123456789102",
        "detail": {
          "request": {
            "eventName": "putObject",
            "bucketName": "testBucket"
          }
        },
        "detail-type": "API Call",
        "id": "123456",
        "region": "us-west-2",
        "resources": [
          "testBucket"
        ],
        "source": "aws.s3",
        "time": "Jan 01 2018 12:00",
        "version": "1.05"
      },
      "description": "An example test with a full cloudwatch event",
      "log": "cloudwatch:events",
      "service": "s3",
      "source": "test-s3-bucket-name",
      "trigger_rules": [
        "my_fake_rule"
      ]
    }
  ]

Let's say a rule is only checking the value of ``source`` in the test event. In that case, there's no added benefit to filling in all of the other data. Here is what the event would look like with ``override_record``:

.. code-block:: json

  [
    {
      "override_record": {
        "source": "aws.s3"
      },
      "description": "An example test with a partial cloudwatch event",
      "log": "cloudwatch:events",
      "service": "s3",
      "source": "test-s3-bucket-name",
      "trigger_rules": [
        "my_fake_rule"
      ]
    }
  ]

Both test events would have the same result, but with much less effort.
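
Conceptually, the testing framework overlays ``override_record`` onto a template record for the given log type. The sketch below illustrates the idea only; it is not the framework's actual implementation, and the trimmed template fields are assumptions based on the full event above:

.. code-block:: python

  # Hypothetical, trimmed template for the cloudwatch:events log type
  template_record = {
      'account': '', 'detail': {}, 'detail-type': '', 'id': '', 'region': '',
      'resources': [], 'source': '', 'time': '', 'version': ''
  }

  # The partial test event supplies only the field the rule cares about
  override_record = {'source': 'aws.s3'}

  # Fields from override_record take precedence over the template defaults
  test_record = dict(template_record, **override_record)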

.. note:: Either ``override_record`` or ``data`` is required in the test event.
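
For reference, a rule exercised by both example test events above might look like the sketch below. This is purely illustrative: ``my_fake_rule`` is hypothetical, and the import path is assumed from the rule files included elsewhere in this repository:

.. code-block:: python

  from stream_alert.rule_processor.rules_engine import StreamRules  # assumed import path

  rule = StreamRules.rule


  @rule(logs=['cloudwatch:events'])
  def my_fake_rule(rec):
      """Hypothetical rule: alert on any CloudWatch event whose source is S3"""
      return rec['source'] == 'aws.s3'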

Rule Test Reference
-------------------
@@ -33,57 +103,87 @@ Rule Test Reference
Key                        Type                  Required  Description
-------------------------  --------------------  --------  -----------
``compress``               ``boolean``           No        Whether or not to compress records with ``gzip`` prior to testing. This is useful to simulate services that send gzipped data
``data``                   ``map or string``     Yes       The record to test against your rules. All ``json`` log types should be in JSON object/dict format while others (``csv, kv, syslog``) should be ``string``
``override_record``        ``map``               No        A partial record to use in test events; see the example above
``description``            ``string``            Yes       A short sentence describing the intent of the test
``log``                    ``string``            Yes       The log type this test record should parse as. The value of this should be taken from the defined logs in ``conf/logs.json``
``service``                ``string``            Yes       The name of the service which sent the log, e.g. ``kinesis, s3, sns, or stream_alert_app``
``source``                 ``string``            Yes       The name of the Kinesis stream, S3 bucket, SNS topic, or StreamAlert App function from which the data originated. This value should match a source provided in ``conf/sources.json``
``trigger_rules``          ``list``              Yes       A list of zero or more rule names that this test record should trigger. An empty list implies this record should not trigger any alerts
``validate_schemas_only``  ``boolean``           No        Whether or not the test record should go through the rule processing engine. If set to ``true``, this record will only have validation performed
=========================  ====================  ========  ===========

For more examples, see the provided default rule tests in ``tests/integration/rules``

Running Tests
~~~~~~~~~~~~~

Tests are run via the ``manage.py`` script. These tests include the ability to validate rules for
accuracy and to send alerts to outputs to verify proper configuration.

When adding new rules, it is only necessary to run tests for the **rule processor**. If making code changes to the alert
processor, such as adding a new output integration to send alerts to, tests for the **alert processor** should also be performed.

To run integration tests for the **rule processor**:

.. code-block:: bash

  $ python manage.py lambda test --processor rule

To run integration tests for the **alert processor**:

.. code-block:: bash

  $ python manage.py lambda test --processor alert

To run end-to-end integration tests for **both processors**:

.. code-block:: bash

  $ python manage.py lambda test --processor all

Integration tests can be restricted to **specific rules** to reduce time and output:

.. code-block:: bash

  $ python manage.py lambda test --processor rule --test-rules <rule_01> <rule_02>

Integration tests can be restricted to **specific file names** to reduce time and output (the ``.json`` suffix is optional):

.. code-block:: bash

  $ python manage.py lambda test --processor rule --test-files <test_file_01.json> <test_file_02>

Integration tests can send **live test alerts** to configured outputs for rules using a specified cluster.
This can also be combined with an optional list of rules to use for tests (using the ``--rules`` argument):

.. code-block:: bash

  $ python manage.py live-test --cluster <cluster_name>

Here is a sample command showing how to run tests against two rules included as integration tests in the default StreamAlert configuration:

.. code-block:: bash

  $ python manage.py lambda test --processor rule --rules cloudtrail_put_bucket_acl cloudtrail_root_account_usage

This will produce output similar to the following::

  cloudtrail_put_bucket_acl
    [Pass] [trigger=1] rule (kinesis): An AWS S3 bucket with 'AllUsers' permission(s) will create an alert.
    [Pass] [trigger=1] rule (kinesis): An AWS S3 bucket with 'AuthenticatedUsers' permission(s) will create an alert.
    [Pass] [trigger=0] rule (kinesis): An AWS PutBucketAcl call without 'AuthenticatedUsers' & 'AllUsers' will not create an alert.

  cloudtrail_root_account_usage
    [Pass] [trigger=1] rule (kinesis): Use of the AWS 'Root' account will create an alert.
    [Pass] [trigger=0] rule (kinesis): AWS 'Root' account activity initiated automatically by an AWS service on your behalf will not create an alert.

  StreamAlertCLI [INFO]: (5/5) Successful Tests
  StreamAlertCLI [INFO]: Completed

Validate Log Schemas
~~~~~~~~~~~~~~~~~~~~

@@ -160,72 +260,41 @@ This will produce output similar to the following::
  StreamAlertCLI [ERROR]: (1/2) Failures
  StreamAlertCLI [ERROR]: (1/1) [cloudtrail_put_object_acl] Data is invalid due to missing key(s) in test record: 'eventVersion'. Rule: 'cloudtrail_put_object_acl'. Description: 'CloudTrail - PutObjectAcl - False Positive'

Helpers
~~~~~~~

It's occasionally necessary to dynamically fill in values in our test data. This could be due to time-based rules which utilize the ``last_hour`` `rule helper <rules.html#helpers>`_. In order to test in these scenarios, a testing helper can be used.

Helper Functions
-----------------

``last_hour``: Generates a unix epoch time within the last hour (ex: ``1489105783``).

Usage
-----

To use these helpers in rule testing, replace a specific log field value with the following::

  "<helper:helper_name_goes_here>"

For example, to replace a time based field with ``last_hour``:

.. code-block:: json

  [
    {
      "data": {
        "host": "app01.prod.mydomain.net",
        "time": "<helper:last_hour>"
      },
      "description": "example usage of helpers",
      "log": "host_time_log",
      "service": "kinesis",
      "source": "my_demo_kinesis_stream",
      "trigger_rules": [
        "last_hour_rule_name"
      ]
    }
  ]
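
A rule exercised by this test might consume the stubbed timestamp roughly as shown below. This is a sketch only: ``last_hour_rule_name`` and the ``host_time_log`` schema come from the example above, while the helper's import path and signature are assumptions:

.. code-block:: python

  from helpers.base import last_hour  # assumed location of the last_hour rule helper
  from stream_alert.rule_processor.rules_engine import StreamRules  # assumed import path

  rule = StreamRules.rule


  @rule(logs=['host_time_log'])
  def last_hour_rule_name(rec):
      """Hypothetical rule: alert when a production host reports activity within the last hour"""
      # Assumes the last_hour helper accepts a unix timestamp and returns a boolean
      return rec['host'].endswith('.prod.mydomain.net') and last_hour(rec['time'])
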
4 changes: 1 addition & 3 deletions rules/community/binaryalert/binaryalert_yara_match.py
@@ -4,9 +4,7 @@
rule = StreamRules.rule


@rule(
logs=['binaryalert'],
outputs=['aws-firehose:alerts'])
@rule(logs=['binaryalert'])
def binaryalert_yara_match(rec):
"""
author: Austin Byers (Airbnb CSIRT)

4 changes: 1 addition & 3 deletions rules/community/cloudtrail/cloudtrail_critical_api_calls.py

@@ -6,9 +6,7 @@
disable = StreamRules.disable()


@rule(
logs=['cloudtrail:events'],
outputs=['aws-firehose:alerts'])
@rule(logs=['cloudtrail:events'])
def cloudtrail_critical_api_calls(rec):
"""
author: airbnb_csirt

@@ -6,9 +6,7 @@
disable = StreamRules.disable()


@rule(
logs=['cloudtrail:events'],
outputs=['aws-firehose:alerts'])
@rule(logs=['cloudtrail:events'])
def cloudtrail_mfa_policy_abuse_attempt(rec):
"""
author: Scott Piper of Summit Route in collaboration with Duo Security

@@ -6,7 +6,6 @@

@rule(
logs=['cloudwatch:events'],
outputs=['aws-firehose:alerts'],
req_subkeys={
'detail': ['eventName', 'requestParameters']
})

1 change: 0 additions & 1 deletion rules/community/cloudtrail/cloudtrail_put_bucket_acl.py

@@ -6,7 +6,6 @@

@rule(
logs=['cloudwatch:events'],
outputs=['aws-firehose:alerts'],
req_subkeys={
'detail': ['requestParameters', 'eventName']
})

@@ -7,7 +7,6 @@

@rule(
logs=['cloudwatch:events'],
outputs=['aws-firehose:alerts'],
req_subkeys={
'detail': ['requestParameters']
})