Commit

Merge branch '8.5' into backport/8.5/pr-141239
ashokaditya authored Sep 23, 2022
2 parents 4e90ce6 + 7c9a49b commit a1b1633
Showing 8 changed files with 186 additions and 39 deletions.
Binary file added docs/management/images/runtime_field.png
Binary file added docs/management/images/runtime_field_composite.png
25 changes: 21 additions & 4 deletions docs/management/manage-data-views.asciidoc
@@ -77,9 +77,11 @@ Return `Hello World!`:
emit("Hello World!");
----

image:management/images/runtime_field.png[Runtime field with keyword type]

[float]
[[perform-a-calculation-on-a-single-field]]
===== Perform a calculation on a single field
==== Perform a calculation on a single field

Calculate kilobytes from bytes:

@@ -90,7 +92,7 @@ emit(doc['bytes'].value / 1024)

[float]
[[return-substring]]
===== Return a substring
==== Return a substring

Return the string that appears after the last slash in the URL:

@@ -108,9 +110,24 @@ emit("");
----

[float]
[[replace-nulls-with-blanks]]
===== Replace nulls with blanks
[[composite-runtime-field]]
==== Return multiple fields with a composite runtime field

A single runtime field can also produce multiple subfields when the `Composite` type is selected. The script editor provides default types that can be customized for each subfield.

Return `keyword` and `double` type subfields. Note that the first argument to `emit` is the name of the subfield:

[source,text]
----
emit('subfield_a', 'Hello');
emit('subfield_b', 42);
----

image:management/images/runtime_field_composite.png[Runtime field with composite type]
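The subfields are then addressable as `<field name>.subfield_a` and `<field name>.subfield_b` when you query or aggregate on the data view.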

[float]
[[replace-nulls-with-blanks]]
==== Replace nulls with blanks
Replace `null` values with `None`:

[source,text]

@@ -5,12 +5,16 @@
* 2.0.
*/

import { MlTrainedModelConfig } from '@elastic/elasticsearch/lib/api/typesWithBodyKey';
import { ElasticsearchClient } from '@kbn/core/server';
import { BUILT_IN_MODEL_TAG } from '@kbn/ml-plugin/common/constants/data_frame_analytics';

import { InferencePipeline } from '../../../common/types/pipelines';

import {
fetchAndAddTrainedModelData,
getMlModelTypesForModelConfig,
getMlModelConfigsForModelIds,
fetchMlInferencePipelineProcessorNames,
fetchMlInferencePipelineProcessors,
fetchPipelineProcessorInferenceData,
@@ -200,6 +204,95 @@ describe('fetchPipelineProcessorInferenceData lib function', () => {
});
});

describe('getMlModelTypesForModelConfig lib function', () => {
const mockModel: MlTrainedModelConfig = {
inference_config: {
ner: {},
},
input: {
field_names: [],
},
model_id: 'test_id',
model_type: 'pytorch',
tags: ['test_tag'],
};
const builtInMockModel: MlTrainedModelConfig = {
inference_config: {
text_classification: {},
},
input: {
field_names: [],
},
model_id: 'test_id',
model_type: 'lang_ident',
tags: [BUILT_IN_MODEL_TAG],
};

it('should return the model type and inference config type', () => {
const expected = ['pytorch', 'ner'];
const response = getMlModelTypesForModelConfig(mockModel);
expect(response.sort()).toEqual(expected.sort());
});

it('should include the built in type', () => {
const expected = ['lang_ident', 'text_classification', BUILT_IN_MODEL_TAG];
const response = getMlModelTypesForModelConfig(builtInMockModel);
expect(response.sort()).toEqual(expected.sort());
});
});

describe('getMlModelConfigsForModelIds lib function', () => {
const mockClient = {
ml: {
getTrainedModels: jest.fn(),
getTrainedModelsStats: jest.fn(),
},
};

beforeEach(() => {
jest.clearAllMocks();
});

it('should fetch the models that we ask for', async () => {
mockClient.ml.getTrainedModels.mockImplementation(() =>
Promise.resolve(mockGetTrainedModelsData)
);
mockClient.ml.getTrainedModelsStats.mockImplementation(() =>
Promise.resolve(mockGetTrainedModelStats)
);

const input = {
'trained-model-id-1': {
isDeployed: true,
pipelineName: '',
trainedModelName: 'trained-model-id-1',
types: ['pytorch', 'ner'],
},
'trained-model-id-2': {
isDeployed: true,
pipelineName: '',
trainedModelName: 'trained-model-id-2',
types: ['pytorch', 'ner'],
},
} as Record<string, InferencePipeline>;

const expected = {
'trained-model-id-2': input['trained-model-id-2'],
};
const response = await getMlModelConfigsForModelIds(
mockClient as unknown as ElasticsearchClient,
['trained-model-id-2']
);
expect(mockClient.ml.getTrainedModels).toHaveBeenCalledWith({
model_id: 'trained-model-id-2',
});
expect(mockClient.ml.getTrainedModelsStats).toHaveBeenCalledWith({
model_id: 'trained-model-id-2',
});
expect(response).toEqual(expected);
});
});

describe('fetchAndAddTrainedModelData lib function', () => {
const mockClient = {
ml: {

@@ -5,6 +5,7 @@
* 2.0.
*/

import { MlTrainedModelConfig } from '@elastic/elasticsearch/lib/api/typesWithBodyKey';
import { ElasticsearchClient } from '@kbn/core/server';
import { BUILT_IN_MODEL_TAG } from '@kbn/ml-plugin/common/constants/data_frame_analytics';

@@ -65,39 +66,67 @@ export const fetchPipelineProcessorInferenceData = async (
);
};

export const fetchAndAddTrainedModelData = async (
export const getMlModelTypesForModelConfig = (trainedModel: MlTrainedModelConfig): string[] => {
if (!trainedModel) return [];

const isBuiltIn = trainedModel.tags?.includes(BUILT_IN_MODEL_TAG);

return [
trainedModel.model_type,
...Object.keys(trainedModel.inference_config || {}),
...(isBuiltIn ? [BUILT_IN_MODEL_TAG] : []),
].filter((type): type is string => type !== undefined);
};

export const getMlModelConfigsForModelIds = async (
client: ElasticsearchClient,
pipelineProcessorData: Record<string, InferencePipeline>
trainedModelNames: string[]
): Promise<Record<string, InferencePipeline>> => {
const trainedModelNames = Object.keys(pipelineProcessorData);

const [trainedModels, trainedModelsStats] = await Promise.all([
client.ml.getTrainedModels({ model_id: trainedModelNames.join() }),
client.ml.getTrainedModelsStats({ model_id: trainedModelNames.join() }),
]);

const modelConfigs: Record<string, InferencePipeline> = {};

trainedModels.trained_model_configs.forEach((trainedModelData) => {
const trainedModelName = trainedModelData.model_id;

if (pipelineProcessorData.hasOwnProperty(trainedModelName)) {
const isBuiltIn = trainedModelData.tags.includes(BUILT_IN_MODEL_TAG);

pipelineProcessorData[trainedModelName].types = [
trainedModelData.model_type,
...Object.keys(trainedModelData.inference_config || {}),
...(isBuiltIn ? [BUILT_IN_MODEL_TAG] : []),
].filter((type): type is string => type !== undefined);
if (trainedModelNames.includes(trainedModelName)) {
modelConfigs[trainedModelName] = {
isDeployed: false,
pipelineName: '',
trainedModelName,
types: getMlModelTypesForModelConfig(trainedModelData),
};
}
});

trainedModelsStats.trained_model_stats.forEach((trainedModelStats) => {
const trainedModelName = trainedModelStats.model_id;
if (pipelineProcessorData.hasOwnProperty(trainedModelName)) {
if (modelConfigs.hasOwnProperty(trainedModelName)) {
const isDeployed = trainedModelStats.deployment_stats?.state === 'started';
pipelineProcessorData[trainedModelName].isDeployed = isDeployed;
modelConfigs[trainedModelName].isDeployed = isDeployed;
}
});

return modelConfigs;
};

export const fetchAndAddTrainedModelData = async (
client: ElasticsearchClient,
pipelineProcessorData: Record<string, InferencePipeline>
): Promise<Record<string, InferencePipeline>> => {
const trainedModelNames = Object.keys(pipelineProcessorData);
const modelConfigs = await getMlModelConfigsForModelIds(client, trainedModelNames);

for (const [modelName, modelData] of Object.entries(modelConfigs)) {
if (pipelineProcessorData.hasOwnProperty(modelName)) {
pipelineProcessorData[modelName].types = modelData.types;
pipelineProcessorData[modelName].isDeployed = modelData.isDeployed;
}
}

return pipelineProcessorData;
};


@@ -41,7 +41,9 @@ describe('createIndexPipelineDefinitions util function', () => {
describe('formatMlPipelineBody util function', () => {
const modelId = 'my-model-id';
let modelInputField = 'my-model-input-field';
const modelType = 'my-model-type';
const modelType = 'pytorch';
const inferenceConfigKey = 'my-model-type';
const modelTypes = ['pytorch', 'my-model-type'];
const modelVersion = 3;
const sourceField = 'my-source-field';
const destField = 'my-dest-field';
@@ -59,7 +61,6 @@
it('should return the pipeline body', async () => {
const expectedResult = {
description: '',
version: 1,
processors: [
{
remove: {
@@ -69,37 +70,41 @@
},
{
inference: {
model_id: modelId,
target_field: `ml.inference.${destField}`,
field_map: {
[sourceField]: modelInputField,
},
model_id: modelId,
target_field: `ml.inference.${destField}`,
},
},
{
append: {
field: '_source._ingest.processors',
value: [
{
type: modelType,
model_id: modelId,
model_version: modelVersion,
processed_timestamp: '{{{ _ingest.timestamp }}}',
types: modelTypes,
},
],
},
},
],
version: 1,
};

const mockResponse = {
count: 1,
trained_model_configs: [
{
inference_config: {
[inferenceConfigKey]: {},
},
input: { field_names: [modelInputField] },
model_id: modelId,
version: modelVersion,
model_type: modelType,
input: { field_names: [modelInputField] },
version: modelVersion,
},
],
};
@@ -131,7 +136,6 @@
modelInputField = 'MODEL_INPUT_FIELD';
const expectedResult = {
description: '',
version: 1,
processors: [
{
remove: {
@@ -141,36 +145,40 @@
},
{
inference: {
model_id: modelId,
target_field: `ml.inference.${destField}`,
field_map: {
[sourceField]: modelInputField,
},
model_id: modelId,
target_field: `ml.inference.${destField}`,
},
},
{
append: {
field: '_source._ingest.processors',
value: [
{
type: modelType,
model_id: modelId,
model_version: modelVersion,
processed_timestamp: '{{{ _ingest.timestamp }}}',
types: modelTypes,
},
],
},
},
],
version: 1,
};
const mockResponse = {
count: 1,
trained_model_configs: [
{
inference_config: {
[inferenceConfigKey]: {},
},
input: { field_names: [] },
model_id: modelId,
version: modelVersion,
model_type: modelType,
input: { field_names: [] },
version: modelVersion,
},
],
};
