Log Analytics Advanced Queries

Advanced Queries from Azure Log Analytics can be a bit daunting at first, however below are some example Log Analytics Queries to help get you started:

Here are some links to more details:

Log Analytics Demo site – https://portal.loganalytics.io/demo#/discover/query/main
Kusto Course – https://www.pluralsight.com/courses/kusto-query-language-kql-from-scratch
Log Analytics new log search FAQ and known issues – https://docs.microsoft.com/en-us/azure/log-analytics/log-analytics-log-search-faq
Cheat Sheet – https://docs.microsoft.com/en-us/azure/log-analytics/log-analytics-log-search-transition
Language Reference – https://docs.loganalytics.io/docs/Language-Reference
Getting started guide (20 mins) – https://docs.loganalytics.io/docs/Learn/Getting-Started/Getting-started-with-queries

//---------------- 80% of what you'll ever do, 10 commands -------------------//
// search, where, take, count, summarize, bin, top, extend, project, distinct //
//----------------------------------------------------------------------------//

Top 5 running processes in the last 3 days

// Find all processes that started in the last 3 days. ID 4688: A new process has been created.

let RunProcesses = SecurityEvent

| where TimeGenerated > ago(3d)

| where EventID == “4688”;

// Find the 5 processes that were run the most

let Top5Processes =

RunProcesses

| summarize count() by Process

| top 5 by count_;

// Create a time chart of these 5 processes – hour by hour

RunProcesses

| where Process in (Top5Processes)

| summarize count() by bin (TimeGenerated, 1h), Process

| render timechart

Update

//Computers Missing Updates last week and still missing it.

let lastDayComputersMissingUpdates = Update

| where TimeGenerated between (ago(3d)..ago(2d))

| where Classification == “Critical Updates” and UpdateState != “Not needed” and UpdateState != “NotNeeded”

| summarize makeset(Computer);

Update

| where TimeGenerated > ago(1d)

| where Classification == “Critical Updates” and UpdateState != “Not needed” and UpdateState != “NotNeeded”

| where Computer in (lastDayComputersMissingUpdates)

| summarize UniqueUpdatesCount = dcount(Product) by Computer, OSType

//Security updates:

//Needed Security Updates & Critical Updates by Computer

Update

| where OSType != “Linux” and UpdateState == “Needed” and Optional == “false” and (Classification == “Security Updates” or Classification == “Critical Updates”)

| summarize UniqueUpdatesCount = count(), makeset(Title), makeset(KBID) by Computer

//Security updates:

//List of Computers missing updates and also detected high severity security dections

Update

| where TimeGenerated >= ago(7d)

| where UpdateState == “Needed”

| summarize UpdatesNeeded=makeset(Title), Updates=dcount(Title) by Computer

| join kind= innerunique

(

SecurityDetection

| where TimeGenerated >= ago(7d)

| where AlertSeverity == “High”

| summarize SecurityAlerts=makeset(AlertTitle), HighAlertsCount=count() by Computer

)

on Computer

| project-away Computer

Event Log

//find which accounts failed to logon on computers where we identify a security detection

let detections = toscalar(SecurityDetection

| summarize makeset(Computer));

SecurityEvent

| where Computer in (detections) and EventID == 4624

| summarize count() by Account

//Session Duration

SecurityEvent

| where EventID in (4624, 4634)

| project Computer, Account, TargetLogonId, TimeGenerated, EventID

| order by TimeGenerated asc, EventID asc

| summarize TimeList = makelist(TimeGenerated/1s, 100000) by Computer, Account, TargetLogonId

| extend SessionDuration = series_fir(TimeList, dynamic([1,-1]), false, false)

| mvexpand SessionDuration limit 1000000

| extend SessionDuration = todouble(SessionDuration)

| where SessionDuration != todouble(TimeList[0])

| project-away TimeList

| summarize count(), SessionDuration=avg(SessionDuration), dcount(TargetLogonId), dcount(Account) by Computer

| order by SessionDuration asc

//parse

SecurityEvent

| project Activity

| parse Activity with activityID ” – “ activityDesc

| take 100

SecurityEvent

| project Activity

| extend activityArr=split(Activity, ” – “)

| project Activity , activityArr, activityId=activityArr[0]

| take 100

SecurityEvent

| project Activity

| parse Activity with activityID ” – “ activityDesc

| summarize count() by activityID

Perf

//correlate Memory and CPU custom hours

let StartTime = datetime(2017-11-12 00:30);

let EndTime = datetime(2017-11-22 00:30);

Perf

| where CounterName == “% Processor Time”

| where TimeGenerated > StartTime and TimeGenerated < EndTime

| project TimeGenerated, Computer, cpu=CounterValue //project | Select the columns to include, rename or drop, and insert new computed columns

| join kind= inner ( //join | Merge the rows of two tables to form a new table by matching values of the specified column(s) from each table

Perf

| where CounterName == “% Committed Bytes In Use”

| where TimeGenerated > StartTime and TimeGenerated < EndTime

| project TimeGenerated , Computer, mem=CounterValue

) on TimeGenerated, Computer

| summarize avgCpu=avg(cpu), maxMem=max(mem) by Computer, TimeGenerated bin=1hr //summarize | Produces a table that aggregates the content of the input table

| render timechart

//correlate Memory and CPU the past hour

let StartTime = now(-1h);

let EndTime = now();

Perf

| where CounterName == “% Processor Time”

| where TimeGenerated > StartTime and TimeGenerated < EndTime

| project TimeGenerated, Computer, cpu=CounterValue //project | Select the columns to include, rename or drop, and insert new computed columns

| join kind= inner ( //join | Merge the rows of two tables to form a new table by matching values of the specified column(s) from each table

Perf

| where CounterName == “% Committed Bytes In Use”

| where TimeGenerated > StartTime and TimeGenerated < EndTime

| project TimeGenerated , Computer, mem=CounterValue

) on TimeGenerated, Computer

| summarize avgCpu=avg(cpu), maxMem=max(mem) by Computer, TimeGenerated bin=1hr //summarize | Produces a table that aggregates the content of the input table

| render timechart

//Performance of computers in a group

let group1 = Heartbeat | where Computer contains “1598” | summarize by Computer, group=“group1”;

let group2 = Heartbeat | where Computer contains “1599”| summarize by Computer, group=“group2”;

let combinedGroup= union group1, group2;

let projectedComputers = combinedGroup | summarize makeset(Computer);

Perf

| where ObjectName == “Processor”

| where CounterName == “% Processor Time”

| where Computer in (projectedComputers)

| summarize avg(CounterValue) by bin(TimeGenerated, 15m), Computer

| render timechart

//CPU Performance of computers

Perf

| where CounterName == “% Processor Time” and ObjectName == “Processor” and InstanceName == “_Total”

| summarize AVGCPU = avg(CounterValue) by bin(TimeGenerated, 1h), Computer

| sort by TimeGenerated desc

| render timechart

// Oql: Type:Perf CounterName=”% Processor Time” ObjectName=Processor InstanceName=_Total | measure avg(CounterValue) as AVGCPU by Computer | display linechart // WorkspaceId: {b438b4f6-912a-46d5-9cb1-b44069212abc} // Version: 0.1.115

//Moving Average Performance over 15 minutes

let endTime=now();

let timerange =1d;

let startTime=now() – timerange;

let mInterval=4;

let mAvgParm = repeat(1, mInterval);

Perf

| where ObjectName == “Processor”

| where CounterName == “% Processor Time”

| make-series avgCpu=avg(CounterValue) default=0 on TimeGenerated in range(startTime, endTime, 15m) by Computer

| extend moving_avgCpu = series_fir(avgCpu, mAvgParm)

| render timechart

// disk space

let PercentSpace = 50; //enter the threshold for the disk space percentage

Perf

| where ObjectName == “LogicalDisk” and CounterName == “% Free Space”

| summarize FreeSpace = min(CounterValue) by Computer, InstanceName

// | where InstanceName == “C:” or InstanceName == “D:” or InstanceName == “E:”

| where InstanceName contains “:”

// look for the colon in the drive letter

| where FreeSpace < PercentSpace

// set to < in normal circumstances

| sort by FreeSpace asc

| render barchart kind = unstacked

//Comparing performance in groups of computers

Perf

| where ObjectName == “Processor”

| where CounterName == “% Processor Time”

| extend group = case(Computer contains “1598”, “admgrup”, Computer contains “1599”, “bsgroup”, “other”)

| summarize avg(CounterValue) by bin(TimeGenerated, 1h) , group

| render timechart

Perf

| where ObjectName==“Processor” and CounterName==“% Processor Time”

| summarize avg(CounterValue) by Computer | where avg_CounterValue > 10

Perf

| where ObjectName==“Memory” and CounterName==“% Committed Bytes In Use”

| summarize avg(CounterValue) by Computer | where avg_CounterValue > 70

Perf

| where ObjectName == “Processor” and CounterName == “% Processor Time” and InstanceName == “_Total” and Computer in ((Heartbeat

| where OSType == “Windows”

| distinct Computer))

| summarize AggregatedValue = avg(CounterValue) by bin(TimeGenerated, 1h), Computer

| render timechart

Perf

| where TimeGenerated > ago(1d)

| where CounterName == “% Processor Time”

| summarize avg(CounterValue), percentiles(CounterValue, 50, 95) by bin(TimeGenerated, 1h)

| extend Threshold = 10 // set a refernce line

| render timechart

let StartTime = now()-5d; let EndTime = now()-4d; Perf | where CounterName == “% Processor Time” | where TimeGenerated > StartTime and TimeGenerated < EndTime and TimeGenerated < EndTime | project TimeGenerated, Computer, cpu=CounterValue | join kind= inner ( Perf | where CounterName == “% Used Memory” | where TimeGenerated > StartTime and TimeGenerated < EndTime | project TimeGenerated , Computer, mem=CounterValue ) on TimeGenerated, Computer | summarize avgCpu=avg(cpu), maxMem=max(mem) by TimeGenerated bin=30m | render timechart

// Performance trends

// Example output: The “Reference” line is from 3 days ago and the “Current” line is for the latest 24 hours. I was collecting the “Processor(_Total)\% Processor Time” perf counter.

let computerContains = “ejukebox”; // add name to define the computer you want to look at

let perfCounterName = “% Processor Time”; // change to be the perf counter you want to compare

let binSize = 15m; // using the bin function with 15 minute bins to aggregate average perf counter values

let refDelay = 3d; // reference data will be 3 days before now

let EndTime = now();

let StartTime = EndTime – 1d;

let ReferenceEndTime = EndTime – refDelay;

let ReferenceStartTime = StartTime – refDelay;

Perf

| where Computer contains computerContains and CounterName == perfCounterName

| where TimeGenerated between(StartTime .. EndTime) or TimeGenerated between(ReferenceStartTime .. ReferenceEndTime)

| extend RefTimeGenerated = iif( TimeGenerated between( StartTime .. EndTime ),TimeGenerated, TimeGenerated + refDelay) //extend | Create calculated columns and append them to the result set

| extend ID = iif( TimeGenerated between( StartTime .. EndTime ), “Current”, “Reference”)

| summarize avg(CounterValue) by ID, bin(RefTimeGenerated, binSize)

| render timechart

//All Performance data from a particular computer

Perf | where CounterName == “Current Disk Queue Length”

//Average CPU Utilization across all computers

Perf | where ObjectName == “Processor” and CounterName == “% Processor Time” and InstanceName == “_Total” | summarize AVGCPU = avg(Average) by Computer

//Maximum CPU Utilization across all computers

Perf | where CounterName == “% Processor Time” | summarize AggregatedValue = max(Max) by Computer

//Average Current Disk Queue length across all the instances of a given computer

Perf | where ObjectName == “LogicalDisk” and CounterName == “Current Disk Queue Length” and Computer == “MyComputerName” | summarize AggregatedValue = avg(Average) by InstanceName

//Hourly average of CPU usage across all computers

Perf | where CounterName == “% Processor Time” and InstanceName == “_Total” | summarize AggregatedValue = avg(CounterValue) by bin(TimeGenerated, 1h), Computer

//Hourly 70 percentile of every % percent counter for a particular computer

Perf | where Computer == “MyComputer” and CounterName startswith_cs “%” and InstanceName == “_Total” | summarize AggregatedValue = percentile(CounterValue, 70) by bin(TimeGenerated, 1h), CounterName

Perf | where CounterName == “% Processor Time” and InstanceName == “_Total” and Computer == “MyComputer” | summarize [“min(CounterValue)”] = min(CounterValue), [“avg(CounterValue)”] = avg(CounterValue), [“percentile75(CounterValue)”] = percentile(CounterValue, 75), [“max(CounterValue)”] = max(CounterValue) by bin(TimeGenerated, 1h), Computer

//All Performance data from the Database performance object for the master database from the named SQL Server instance INST2

Perf | where ObjectName == “MSSQL$INST2:Databases” and InstanceName == “master”

AzureDiagnostics

| where ResourceProvider == “MICROSOFT.NETWORK” and Category == “ApplicationGatewayFirewallLog”

| summarize Count=count() by details_file_s, action_s

| top 5 by Count desc

| render piechart

AzureDiagnostics

| where ResourceProvider == “MICROSOFT.NETWORK” and Category == “ApplicationGatewayFirewallLog”

| summarize Count=count() by clientIp_s, action_s

| top 5 by Count desc

| render piechart

AzureDiagnostics

| where ResourceProvider == “MICROSOFT.NETWORK” and Category == “ApplicationGatewayFirewallLog”

| summarize Count=count() by Message, action_s

| top 5 by Count desc

| render piechart

AzureDiagnostics

| where ResourceProvider == “MICROSOFT.NETWORK” and Category == “ApplicationGatewayPerformanceLog”

| project Time=TimeGenerated, Latency_ms=latency_d

| render timechart

AzureDiagnostics

| where ResourceProvider == “MICROSOFT.NETWORK” and Category == “ApplicationGatewayPerformanceLog”

| extend Throughput_Mb = (throughput_d/1000)/1000

| project Time=TimeGenerated, Throughput_Mb

| render timechart

AzureDiagnostics

| where ResourceProvider == “MICROSOFT.NETWORK” and Category == “ApplicationGatewayPerformanceLog”

| project Requests=requestCount_d, FailedRequests=failedRequestCount_d, TimeGenerated

| render timechart

WireData

| where Direction == “Outbound”

| sort by SessionStartTime desc

| summarize count(), makeset(SessionStartTime), makeset(SessionEndTime), makeset(LocalIP), makeset(RemoteIP), makeset(RemotePortNumber), makeset(SessionState), makeset(ProtocolName), makeset(IPVersion) by Computer

WireData

| where Direction == “Inbound”

| sort by SessionStartTime desc

WireData

| sort by SessionStartTime desc

search in (WireData) * | summarize AggregatedValue = sum(TotalBytes) by Computer | limit

search in (WireData) * | summarize AggregatedValue = count() by LocalIP

search in (WireData) * | summarize AggregatedValue = sum(TotalBytes) by ProcessName

search in (WireData) * | summarize AggregatedValue = sum(TotalBytes) by IPVersion

search in (WireData) Direction == “Outbound” | summarize AggregatedValue = count() by RemoteIP

Syslog | sort by TimeGenerated desc

| where SeverityLevel == “err”

| summarize count(), makeset(Facility), makeset(SyslogMessage), makeset(HostIP), makeset(ProcessName), makeset(Type) by Computer

Syslog | sort by TimeGenerated desc

| where SeverityLevel == “warn”

| summarize count(), makeset(Facility), makeset(SyslogMessage), makeset(HostIP), makeset(ProcessName), makeset(Type) by Computer

let EndTime = now();

let StartTime = EndTime – 1d;

DemoMirvac_CL

| where TimeGenerated between(StartTime .. EndTime)

| sort by TimeGenerated desc

| project Station_s, Song_s | render table

//The average response time over a period of 10 seconds for
//the 2 of the 4 microservices (Note Trips API you can monitor a single operation of the API).
ContainerLog 
//| top 500 by TimeGenerated// return the latest 500 results
| where TimeGenerated >= now(-30m) and TimeGenerated <= now()
| project TimeGenerated, LogEntry
| where LogEntry contains "request finished"
| extend LogEntry2 = todouble(extract(@"Request finished in ([0-9.]*)ms", 1, LogEntry))
| summarize LogEntry2=avg(LogEntry2) by bin(TimeGenerated, 10s)
| render timechart

Marc Kean

Azure Tech Consultant

Log Analytics Advanced Queries

Update

Event Log

Perf

Leave a comment Cancel reply

Log Analytics Advanced Queries

Update

Event Log

Perf

Share this:

Leave a comment Cancel reply