Multiple IP Entity Syslog

Query

// This query assumes a feed of threat indicators is ingested/synchronized periodically, and that each synchronization ingests new indicators plus only those old indicators that have been modified.
// Active threat indicators in Sentinel are refreshed (re-emitted) as ThreatIntelligenceIndicator events every ~12 days.
// Length of the "current events" window, and the cutoff (ago(query_frequency)) after which an indicator counts as new.
// Presumably equal to the scheduling interval of the analytics rule - confirm against the rule settings.
let query_frequency = 1h;
// Lookback applied to ThreatIntelligenceIndicator when collecting indicators.
let query_period = 14d;
// Offset added to the ago() bounds of both Syslog event windows; 0h means the current window ends at now().
let query_wait = 0h;
// How far back past Syslog events are re-checked against newly received indicators.
let table_query_lookback = 2d;
// (IndicatorId, BenignProperty) pairs read from the 'ID-TIBenignProperty' watchlist, limited to rows whose
// Notes column contains "[DestinationIPAddress]". Consumed as the right side of a leftanti join in
// _TITableMatch, so an indicator is dropped only for the specific IP value listed here.
let _TIBenignProperty =
    _GetWatchlist('ID-TIBenignProperty')
    | where Notes has_any ("[DestinationIPAddress]")
    | project IndicatorId, BenignProperty
;
// Dynamic array with every Auxiliar value of the 'Activity-ExpectedSignificantActivity' watchlist rows whose
// Activity is "ThreatIndicatorSource". Indicators whose AdditionalInformation or Description contains any of
// these terms (has_any) are excluded in _TITableMatch.
let _TIExcludedSources = toscalar(
    _GetWatchlist('Activity-ExpectedSignificantActivity')
    | where Activity == "ThreatIndicatorSource"
    | summarize make_list(Auxiliar)
    );
// IPv4 pattern read from the 'RegEx-SingleRegularExpressions' watchlist (UseCase "Threat Intelligence Indicator IPv4").
// toscalar() keeps only the first row's RegEx value.
// NOTE(review): assumes the watchlist holds exactly one row for this UseCase - confirm.
let _IPv4Regex = toscalar(
    _GetWatchlist('RegEx-SingleRegularExpressions')
    | where UseCase == "Threat Intelligence Indicator IPv4"
    | project RegEx
    );
// IPv6 pattern read from the 'RegEx-SingleRegularExpressions' watchlist (UseCase "Threat Intelligence Indicator IPv6").
// toscalar() keeps only the first row's RegEx value.
// NOTE(review): assumes the watchlist holds exactly one row for this UseCase - confirm.
let _IPv6Regex = toscalar(
    _GetWatchlist('RegEx-SingleRegularExpressions')
    | where UseCase == "Threat Intelligence Indicator IPv6"
    | project RegEx
    );
// Matches IP-based threat indicators against IP addresses extracted from Syslog messages.
//   table_start, table_end: bounds of the Syslog TimeGenerated window (both inclusive, via "between").
//   only_new_ti: when true, indicators whose earliest TimeGenerated within query_period is before ti_start are discarded.
//   ti_start: cutoff for "new" indicators; only relevant when only_new_ti is true (defaults to null).
// Returns the inner join of indicators and Syslog events on IPAddress, projected to the indicator and Syslog columns listed at the end.
let _TITableMatch = (table_start: datetime, table_end: datetime, only_new_ti: boolean, ti_start: datetime = datetime(null)) {
    // Scheduled Analytics rules have a query period limit of 14d
    let _Indicators =// materialize(
        ThreatIntelligenceIndicator
        | where TimeGenerated > ago(query_period)
        // Take the earliest TimeGenerated and the latest column info
        | summarize hint.strategy=shuffle
            minTimeGenerated = min(TimeGenerated),
            arg_max(TimeGenerated, Active, Description, ActivityGroupNames, IndicatorId, ThreatType, DomainName, Url, ExpirationDateTime, ConfidenceScore, SourceSystem, Tags, AdditionalInformation, ExternalIndicatorId, NetworkIP, NetworkSourceIP, NetworkDestinationIP, EmailSourceIpAddress)
            by IndicatorId
        // Remove inactive or expired indicators
        | where not(not(Active) or ExpirationDateTime < now())
        // Pick indicators that contain the desired entity type: one row per non-empty IP field of the indicator
        | mv-expand IPAddress = pack_array(NetworkIP, NetworkSourceIP, NetworkDestinationIP, EmailSourceIpAddress) to typeof(string)
        | where isnotempty(IPAddress)
        // Keep a copy of the indicator IP under a distinct name; it is the one returned in the final projection
        | extend TI_IPAddress = IPAddress
        // Remove indicators from specific sources
        | where not(AdditionalInformation has_any (_TIExcludedSources) or Description has_any (_TIExcludedSources))
        // Remove excluded indicators with benign properties (same IndicatorId and IP value listed as benign)
        | join kind=leftanti _TIBenignProperty on IndicatorId, $left.IPAddress == $right.BenignProperty
        // Deduplicate indicators by IPAddress column, equivalent to using join kind=innerunique afterwards
        // The earliest minTimeGenerated across the duplicates is kept; the remaining columns come from an arbitrary one of them
        | summarize hint.strategy=shuffle
            minTimeGenerated = min(minTimeGenerated),
            take_any(*)
            by IPAddress
        // If we want only new indicators, remove indicators received previously
        | where not(only_new_ti and minTimeGenerated < ti_start)
    //)
    ;
    // Disabled prefilter experiment, kept for reference.
    // NOTE(review): the character class "[0-9A-Za-f]" below looks like a typo for "[0-9A-Fa-f]" - confirm before re-enabling.
    //let _IndicatorsLength = toscalar(_Indicators | summarize count());
    //let _IndicatorsPrefilter = toscalar(
    //    _Indicators
    //    | extend AuxiliarField = tostring(extract(@"([0-9A-Za-f]+)[\.\:]", 1, IPAddress))
    //    | summarize make_set_if(AuxiliarField, isnotempty(AuxiliarField), 10000)
    //);
    //let _IndicatorsPrefilterLength = array_length(_IndicatorsPrefilter);
    let _TableEvents =
        Syslog
        | where TimeGenerated between (table_start .. table_end)
        // Filter events that may contain indicators
        | where isnotempty(SyslogMessage) and not(SyslogMessage has @'[preauth]')
        //| where not(Facility in ("auth", "authpriv") and not(ProcessName == "sudo") and (SyslogMessage has_any ("from", "Timeout before authentication") or (SyslogMessage has_any ("closed", "reset") and SyslogMessage has_all ("by", "port"))) and not(SyslogMessage has_any ("Disconnecting", "Disconnected", "Accepted", "disconnect")))
        //| where not(_IndicatorsPrefilterLength < 10000 and not(SyslogMessage has_any (_IndicatorsPrefilter))) // "has_any" limit 10000
        // Extract every IPv4/IPv6 candidate (capture group 1) that follows a whitespace character, one row per address
        // NOTE(review): the leading "\s" means an address at the very start of the message, or directly after a non-whitespace character, is not captured - confirm this is intended
        | mv-expand IPAddress = todynamic(dynamic_to_json(extract_all(strcat(@"\s", "(", _IPv4Regex, "|", _IPv6Regex, ")"), dynamic([1]), SyslogMessage))) to typeof(string)
        // Drop private, 0.0.0.0/8 and 127.0.0.0/8 IPv4 addresses; values that do not parse as IPv4 are kept
        | where isnotempty(IPAddress) and not(isnotempty(parse_ipv4(IPAddress)) and (ipv4_is_private(IPAddress) or ipv4_is_in_any_range(IPAddress, "0.0.0.0/8", "127.0.0.0/8")))
        //| where not(_IndicatorsLength < 1000000 and not(IPAddress in (toscalar(_Indicators | summarize make_list(TI_IPAddress))))) // "in" limit 1.000.000
        // Give the event time its own name so it does not collide with the indicator's TimeGenerated after the join
        | project-rename Syslog_TimeGenerated = TimeGenerated
    ;
    _Indicators
    | join kind=inner hint.strategy=shuffle _TableEvents on IPAddress
    // Take only a single event by key columns
    //| summarize hint.strategy=shuffle take_any(*) by IPAddress, HostName
    | project
        Syslog_TimeGenerated,
        Description,
        ActivityGroupNames,
        IndicatorId,
        ThreatType,
        DomainName,
        Url,
        ExpirationDateTime,
        ConfidenceScore,
        SourceSystem,
        Tags,
        AdditionalInformation,
        TI_IPAddress,
        NetworkIP,
        NetworkSourceIP,
        NetworkDestinationIP,
        EmailSourceIpAddress,
        HostName,
        HostIP,
        Facility,
        SeverityLevel,
        ProcessName,
        SyslogMessage
};
// Window boundaries, all relative to the same now().
let _CurrentWindowStart = ago(query_frequency + query_wait);
let _CurrentWindowEnd = ago(query_wait);
let _PastWindowStart = ago(table_query_lookback + query_wait);
let _NewIndicatorsSince = ago(query_frequency);
union
    // Current Syslog events against every available indicator
    _TITableMatch(_CurrentWindowStart, _CurrentWindowEnd, false),
    // Past Syslog events against indicators that are new since the last query execution
    _TITableMatch(_PastWindowStart, _CurrentWindowStart, true, _NewIndicatorsSince)
// Keep the most recent matching event per indicator and host
| summarize arg_max(Syslog_TimeGenerated, *) by IndicatorId, HostName
// Entity mapping columns
| extend timestamp = Syslog_TimeGenerated, HostCustomEntity = HostName, IPCustomEntity = TI_IPAddress

Explanation

This KQL query is designed to identify and match threat indicators with syslog events in Microsoft Sentinel. Here's a simplified breakdown of what the query does:

Setup and Definitions:
- The query defines several parameters and helper functions to manage time frames and filter criteria.
- It retrieves lists of benign properties and excluded sources from watchlists to filter out non-threatening indicators.
- It also retrieves regular expressions for matching IPv4 and IPv6 addresses.
Threat Indicator Processing:
- The query fetches threat indicators from the ThreatIntelligenceIndicator table that are active and not expired.
- It filters out indicators from excluded sources and those with benign properties.
- It deduplicates the indicators based on IP addresses and optionally filters out indicators that have been seen before.
Syslog Event Processing:
- The query retrieves syslog events from the Syslog table within specified time frames.
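- It skips empty messages and messages containing "[preauth]", then uses the IPv4 and IPv6 regular expressions to extract the IP addresses that appear in each remaining message.
- It discards private IPv4 addresses as well as addresses in the 0.0.0.0/8 and 127.0.0.0/8 (loopback) ranges.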
Matching and Output:
- The query matches the processed threat indicators with the syslog events based on IP addresses.
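- It runs the match twice and combines the results: events from the last hour are checked against all available indicators, and older events (up to 2 days back) are checked only against indicators that are new since the last query execution.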
- The results are summarized to show the most recent syslog event for each indicator and host combination.
- The final output includes details about the threat, such as description, threat type, and associated IP addresses, along with syslog event details.

In essence, this query is used to correlate threat intelligence data with syslog events to identify potential security threats in a network environment.

Details

Jose Sebastián Canós

Released: December 13, 2023

Tables

ThreatIntelligenceIndicator, Syslog

Keywords

ThreatIntelligenceIndicator, Syslog, HostName, HostIP, NetworkIP, NetworkSourceIP, NetworkDestinationIP, EmailSourceIpAddress, DomainName, Url, SourceSystem, Tags, AdditionalInformation, IndicatorId, ActivityGroupNames, ThreatType, Description, ConfidenceScore, ExpirationDateTime, Facility, SeverityLevel, ProcessName, SyslogMessage

Operators

let, where, has_any, project, toscalar, summarize, make_list, project-rename, extend, mv-expand, isnotempty, join, kind=leftanti, kind=inner, hint.strategy=shuffle, pack_array, not, between, dynamic_to_json, extract_all, strcat, todynamic, parse_ipv4, ipv4_is_private, ipv4_is_in_any_range, arg_max, ago, union, by

Actions

GitHub

KQL Search