From ac5865b575ad8707c78243764763f946d7308fe7 Mon Sep 17 00:00:00 2001 From: rjawesome Date: Mon, 1 Jul 2024 13:48:20 -0700 Subject: [PATCH] single subquery queue --- package.json | 1 + src/index.ts | 3 +- src/record.ts | 690 ---------------------- src/transformers/biothings_transformer.ts | 2 +- src/transformers/transformer.ts | 9 +- src/transformers/trapi_transformer.ts | 2 +- src/types.ts | 45 +- 7 files changed, 9 insertions(+), 743 deletions(-) delete mode 100644 src/record.ts diff --git a/package.json b/package.json index a90aecf..30a6e97 100644 --- a/package.json +++ b/package.json @@ -60,6 +60,7 @@ "dependencies": { "@biothings-explorer/utils": "workspace:../utils", "@biothings-explorer/types": "workspace:../types", + "@biothings-explorer/smartapi-kg": "workspace:../smartapi-kg", "@commitlint/cli": "^17.8.1", "@commitlint/config-conventional": "^11.0.0", "async": "^3.2.4", diff --git a/src/index.ts b/src/index.ts index 68b99fd..be6e626 100644 --- a/src/index.ts +++ b/src/index.ts @@ -8,10 +8,9 @@ import TRAPITransformer from "./transformers/trapi_transformer"; import EBIProteinTransformer from "./transformers/ebi_protein_transformer"; import JQTransformer from "./transformers/jq_transformer"; import { BTEQueryObject } from "./types"; -import { Record } from "./record"; +import { Record } from "@biothings-explorer/types"; import Debug from "debug"; const debug = Debug("bte:api-response-transform:index"); -export * from "./record"; export * from "./types"; export default class Transformer { diff --git a/src/record.ts b/src/record.ts deleted file mode 100644 index 2d3001d..0000000 --- a/src/record.ts +++ /dev/null @@ -1,690 +0,0 @@ -import crypto from "crypto"; -import _ from "lodash"; -import { TrapiSource } from "@biothings-explorer/types"; - -function hash(string: string) { - return crypto.createHash("md5").update(string).digest("hex"); -} - -export class RecordNode { - original: string; - normalizedInfo: NodeNormalizerResultObj; - _qNode: QNode; - _apiLabel: string; - - constructor( - node: FrozenNode | VerboseFrozenNode | MinimalFrozenNode, - qNode: QNode, - ) { - this.original = node.original; - this.normalizedInfo = node.normalizedInfo - ? node.normalizedInfo - : this.makeFakeInfo(node); - this._qNode = qNode; - this._apiLabel = node.apiLabel; - } - - makeFakeInfo( - node: FrozenNode | VerboseFrozenNode | MinimalFrozenNode, - ): NodeNormalizerResultObj { - return { - primaryID: node.curie, - equivalentIDs: node.equivalentCuries ?? [], - label: node.label, - labelAliases: node.names, - primaryTypes: [node.semanticType], - semanticTypes: node.semanticTypes ?? [], - attributes: node.attributes ?? {}, - }; - } - - toJSON(): VerboseFrozenNode { - return { - original: this.original, - normalizedInfo: this.normalizedInfo, - qNodeID: this.qNodeID, - isSet: this.isSet, - curie: this.curie, - UMLS: this.UMLS, - semanticType: this.semanticType, - semanticTypes: this.semanticTypes, - label: this.label, - apiLabel: this._apiLabel, - equivalentCuries: this.equivalentCuries, - names: this.names, - attributes: this.attributes, - }; - } - - freeze(): FrozenNode { - const node = this.toJSON() as FrozenNode; - delete node.normalizedInfo; - delete node.equivalentCuries; - delete node.names; - return node; - } - - freezeVerbose(): VerboseFrozenNode { - return this.toJSON(); - } - - freezeMinimal(): MinimalFrozenNode { - return { - original: this.original, - normalizedInfo: this.normalizedInfo, - apiLabel: this._apiLabel, - }; - } - - get qNodeID(): string { - return this._qNode.getID(); - } - - get isSet(): boolean { - return this._qNode.isSet(); - } - - get curie(): string { - return this.normalizedInfo?.primaryID; - } - - get UMLS(): string[] { - return ( - this.normalizedInfo?.equivalentIDs.reduce( - (arr: string[], curie: string) => { - if (curie.includes("UMLS")) arr.push(curie.replace("UMLS:", "")); - return arr; - }, - [], - ) ?? [] - ); - } - - get semanticType(): string[] { - return ( - this.normalizedInfo?.primaryTypes.map( - semanticType => `biolink:${semanticType}`, - ) ?? [] - ); - } - - get semanticTypes(): string[] { - return ( - this.normalizedInfo?.semanticTypes.map( - semanticType => `biolink:${semanticType}`, - ) ?? [] - ); - } - - get label(): string { - if (this.normalizedInfo?.label === this.curie) return this._apiLabel; - return this.normalizedInfo?.label ?? this._apiLabel; - } - - get equivalentCuries(): string[] { - return this.normalizedInfo?.equivalentIDs ?? []; - } - - get names(): string[] { - return this.normalizedInfo?.labelAliases ?? []; - } - - get attributes(): any { - return this.normalizedInfo?.attributes ?? {}; - } -} - -export class Record { - association: Association; - qEdge: QEdge; - config: any; - subject: RecordNode; - object: RecordNode; - reverseToExecution: boolean; - _qualifiers: BulkQualifiers; - _mappedResponse: MappedResponse; - - constructor( - record: FrozenRecord | VerboseFrozenRecord | MinimalFrozenRecord, - config?: any, - apiEdge?: Association, - qEdge?: QEdge, - reverse?: boolean, - ) { - this.association = apiEdge ? apiEdge : this.makeAPIEdge(record); - this.qEdge = qEdge ? qEdge : this.makeFakeQEdge(record); - this.config = config ? config : { EDGE_ATTRIBUTES_USED_IN_RECORD_HASH: [] }; - this.reverseToExecution = reverse || false; - if (!this.reverseToExecution) { - this.subject = new RecordNode(record.subject, this.qEdge.getInputNode()); - this.object = new RecordNode(record.object, this.qEdge.getOutputNode()); - } else { - this.subject = new RecordNode(record.subject, this.qEdge.getOutputNode()); - this.object = new RecordNode(record.object, this.qEdge.getInputNode()); - } - this._qualifiers = record.qualifiers || this.association.qualifiers; - this._mappedResponse = record.mappedResponse ? record.mappedResponse : {}; - if (!this._mappedResponse.publications) { - this._mappedResponse.publications = record.publications; - } - } - - reverse() { - const frozen = { ...this.freezeVerbose() }; - const reversedAPIEdge: Association = { ...frozen.association }; - reversedAPIEdge.input_id = frozen.association.output_id; - reversedAPIEdge.input_type = frozen.association.output_type; - reversedAPIEdge.output_id = frozen.association.input_id; - reversedAPIEdge.output_type = frozen.association.input_type; - const predicate = this.qEdge.getReversedPredicate( - frozen.association.predicate, - ); - reversedAPIEdge.predicate = predicate; - if (reversedAPIEdge.qualifiers) { - const reversedQualifiers = Object.fromEntries( - Object.entries(reversedAPIEdge.qualifiers).map( - ([qualifierType, qualifier]) => { - let newQualifierType: string = qualifierType; - let newQualifier: string | string[] = qualifier; - if (qualifierType.includes("predicate")) { - if (Array.isArray(qualifier)) { - newQualifier = qualifier.map( - (str: string) => - `biolink:${this.qEdge.getReversedPredicate( - str.replace("biolink:", ""), - )}`, - ); - } else { - newQualifier = `biolink:${this.qEdge.getReversedPredicate( - qualifier.replace("biolink:", ""), - )}`; - } - } - if (qualifierType.includes("subject")) { - newQualifierType = qualifierType.replace("subject", "object"); - } - if (qualifierType.includes("object")) { - newQualifierType = qualifierType.replace("object", "subject"); - } - return [newQualifierType, newQualifier]; - }, - ), - ); - - reversedAPIEdge.qualifiers = reversedQualifiers; - frozen.qualifiers = reversedQualifiers; - } - // frozen.predicate = 'biolink:' + predicate; - frozen.association = reversedAPIEdge; - const temp = frozen.subject; - frozen.subject = frozen.object; - frozen.object = temp; - return new Record( - frozen, - this.config, - frozen.association, - this.qEdge, - !this.reverseToExecution, - ); - } - - queryDirection() { - if (!this.qEdge.isReversed()) { - return this; - } else { - return this.reverse(); - } - } - - // for user-made records lacking qEdge - makeFakeQEdge( - record: FrozenRecord | VerboseFrozenRecord | MinimalFrozenRecord, - ): QEdge { - return { - getID(): string { - return "fakeEdge"; - }, - getInputNode(): QNode { - return { - getID(): string { - return record.subject.qNodeID; - }, - isSet(): boolean { - return record.subject.isSet || false; - }, - }; - }, - getOutputNode(): QNode { - return { - getID(): string { - return record.object.qNodeID; - }, - isSet(): boolean { - return record.object.isSet || false; - }, - }; - }, - isReversed(): boolean { - return false; - }, - // WARNING not useable alongside actual QEdge.getHashedEdgeRepresentation - // However the two should never show up together as this is only for testing purposes - getHashedEdgeRepresentation(): string { - return hash( - record.subject.semanticType + - record.predicate + - record.object.semanticType + - (record.subject.equivalentCuries || record.object.equivalentCuries), - ); - }, - }; - } - - makeAPIEdge( - record: FrozenRecord | VerboseFrozenRecord | MinimalFrozenRecord, - ): Association { - return { - predicate: record.predicate?.replace("biolink:", ""), - qualifiers: record.qualifiers - ? Object.fromEntries( - Object.entries(record.qualifiers).map( - ([qualifierType, qualifier]: [string, string]) => { - return [qualifierType.replace("biolink:", ""), qualifier]; - }, - ), - ) - : undefined, - api_name: record.api, - source: record.metaEdgeSource, - "x-translator": { - infores: record.apiInforesCurie, - }, - apiIsPrimaryKnowledgeSource: false, - }; - } - - public static freezeRecords(records: Record[]): FrozenRecord[] { - return records.map((record: Record): FrozenRecord => record.freeze()); - } - - public static unfreezeRecords( - records: FrozenRecord[], - config?: any, - ): Record[] { - return records.map( - (record: FrozenRecord): Record => new Record(record, config), - ); - } - - public static packRecords(records: Record[]): RecordPackage { - // save string space by storing apiEdge and recordNode .normalizedInfo's separately (eliminates duplicates) - const frozenRecords = []; - const apiEdgeHashes = []; - const apiEdges = []; - records.forEach((record: Record) => { - const frozenRecord = record.freezeMinimal(); - - const apiEdgeHash = hash(JSON.stringify(record.association)); - - let apiEdgeHashIndex = apiEdgeHashes.findIndex( - hash => hash === apiEdgeHash, - ); - - if (apiEdgeHashIndex === -1) { - apiEdgeHashes.push(apiEdgeHash); - apiEdges.push(record.association); - apiEdgeHashIndex = apiEdgeHashes.length - 1; - } - - frozenRecords.push({ - ...frozenRecord, - apiEdge: apiEdgeHashIndex, - }); - }); - - return [apiEdges, ...frozenRecords]; - } - - public static unpackRecords( - recordPack: RecordPackage, - qEdge: QEdge, - config?: any, - ): Record[] { - const [apiEdges, ...frozenRecords] = recordPack; - return frozenRecords.map((record: any): Record => { - const apiEdge = apiEdges[record.apiEdge]; - return new Record(record, config, apiEdge, qEdge); - }); - } - - toJSON(): VerboseFrozenRecord { - return { - subject: this.subject.freezeVerbose(), - object: this.object.freezeVerbose(), - association: this.association, - predicate: this.predicate, - qualifiers: this.qualifiers, - publications: this.publications, - recordHash: this.recordHash, - api: this.api, - apiInforesCurie: this.apiInforesCurie, - metaEdgeSource: this.metaEdgeSource, - mappedResponse: this._mappedResponse, - }; - } - - freeze(): FrozenRecord { - const record = this.toJSON() as FrozenRecord; - record.subject = this.subject.freeze(); - record.object = this.object.freeze(); - //@ts-ignore - delete record.association; - record.mappedResponse = { - ...record.mappedResponse, - publications: undefined, - }; - return record; - } - - freezeVerbose(): VerboseFrozenRecord { - return this.toJSON(); - } - - freezeMinimal(): MinimalFrozenRecord { - return { - subject: this.subject.freezeMinimal(), - object: this.object.freezeMinimal(), - qualifiers: this.qualifiers, - publications: this.publications, - mappedResponse: this._mappedResponse, - }; - } - - _getFlattenedEdgeAttributes(attributes: EdgeAttribute[]): EdgeAttribute[] { - return attributes - ? attributes.reduce((arr: EdgeAttribute[], attribute: EdgeAttribute) => { - attribute.attributes - ? arr.push( - attribute, - ...this._getFlattenedEdgeAttributes(attribute.attributes), - ) - : arr.push(attribute); - return arr; - }, []) - : []; - } - - get mappedResponse() { - return Object.fromEntries(Object.entries(this._mappedResponse).filter(([key, _val]) => { - return key !== "source_url" - })) - } - - get _configuredEdgeAttributesForHash(): string { - return this._getFlattenedEdgeAttributes( - this._mappedResponse["edge-attributes"], - ) - .filter(attribute => { - return this.config?.EDGE_ATTRIBUTES_USED_IN_RECORD_HASH?.includes( - attribute.attribute_type_id, - ); - }) - .reduce((acc, attribute) => { - return [...acc, `${attribute.attribute_type_id}:${attribute.value}`]; - }, []) - .join(","); - } - - get _recordHashContent(): string { - return [ - this.subject.curie, - this.predicate, - this.object.curie, - Object.entries(this.qualifiers) - .sort(([qTa, _qVa], [qTb, _qVb]) => qTa.localeCompare(qTb)) - .reduce( - (str, [qualifierType, qualifierValue]) => - `${str};${qualifierType}:${JSON.stringify(qualifierValue)}`, - "", - ), - this.api, - this.metaEdgeSource, - this._configuredEdgeAttributesForHash, - JSON.stringify( - this.provenanceChain.sort((sourceA, sourceB) => - sourceA.resource_id.localeCompare(sourceB.resource_id), - ), - ), - ].join("-"); - } - - get recordHash(): string { - return hash(this._recordHashContent); - } - - get predicate(): string { - return "biolink:" + this.association.predicate; - } - - get qualifiers(): BulkQualifiers { - if (!this._qualifiers) { - return {}; - } - return Object.fromEntries( - Object.entries(this._qualifiers).map(([qualifierType, qualifier]) => { - const newQualifierType = `biolink:${qualifierType.replace( - "biolink:", - "", - )}`; - let newQualifier = qualifier; - if (qualifierType.includes("predicate")) { - if (Array.isArray(qualifier)) { - newQualifier = qualifier.map( - str => `biolink:${str.replace("biolink", "")}`, - ); - } else { - newQualifier = `biolink:${qualifier.replace("biolink:", "")}`; - } - } - return [newQualifierType, newQualifier]; - }), - ); - } - - get api(): string { - return this.association.api_name; - } - - get apiInforesCurie(): string { - if (this.association["x-translator"]) { - return this.association["x-translator"]["infores"] || undefined; - } - return undefined; - } - - get metaEdgeSource(): string { - return this.association.source; - } - - get provenanceChain(): TrapiSource[] { - const source_urls = this._mappedResponse.source_url ?? undefined; - let returnValue: TrapiSource[] = []; - if (this._mappedResponse.trapi_sources) { - returnValue = _.cloneDeep(this._mappedResponse.trapi_sources); - } else { - returnValue.push({ - resource_id: this.association.apiIsPrimaryKnowledgeSource - ? this.apiInforesCurie - : this.metaEdgeSource, - resource_role: "primary_knowledge_source", - source_record_urls: source_urls, - }); - if (!this.association.apiIsPrimaryKnowledgeSource) { - returnValue.push({ - resource_id: this.apiInforesCurie, - resource_role: "aggregator_knowledge_source", - upstream_resource_ids: [this.metaEdgeSource], - }); - } - } - returnValue.push({ - resource_id: this.config.provenanceUsesServiceProvider - ? "infores:service-provider-trapi" - : "infores:biothings-explorer", - resource_role: "aggregator_knowledge_source", - upstream_resource_ids: [this.apiInforesCurie], - }); - return returnValue; - } - - get publications(): string[] { - return this._mappedResponse.publications || []; - } - - get knowledge_level(): string | undefined { - return this.association.knowledge_level; - } - - get agent_type(): string | undefined { - return this.association.agent_type; - } -} - -export interface FrozenRecord { - subject: FrozenNode; - object: FrozenNode; - predicate?: string; // not required if given apiEdge, qEdge - qualifiers?: BulkQualifiers; - publications?: string[]; // not required if given apiEdge, qEdge - recordHash?: string; // always supplied by Record, not required from user - api?: string; // not required if given apiEdge, qEdge - apiInforesCurie?: string; // not required if given apiEdge, qEdge - metaEdgeSource?: string; // not required if given apiEdge, qEdge - mappedResponse?: MappedResponse; -} - -export interface VerboseFrozenRecord { - subject: VerboseFrozenNode; - object: VerboseFrozenNode; - association: Association; - predicate?: string; // not required if given apiEdge, qEdge - qualifiers: BulkQualifiers; - publications?: string[]; // not required if given apiEdge, qEdge - recordHash?: string; // always supplied by Record, not required from user - api?: string; // not required if given apiEdge, qEdge - apiInforesCurie?: string; // not required if given apiEdge, qEdge - metaEdgeSource?: string; // not required if given apiEdge, qEdge - mappedResponse?: MappedResponse; -} - -// removes all computed values on assumption that apiEdge and qEdge are saved elsewhere -export interface MinimalFrozenRecord { - subject: VerboseFrozenNode | MinimalFrozenNode; - object: VerboseFrozenNode | MinimalFrozenNode; - publications?: string[]; // not always present - mappedResponse?: MappedResponse; - [additionalProperties: string]: any; -} - -export interface FrozenNode { - // less verbose, loses extra information from nodeNormalizer - original: string; - qNodeID: string; - isSet: boolean; - curie: string; - UMLS: string[]; - semanticType: string[]; - label: string; - apiLabel?: string; - attributes: any; - [additionalProperties: string]: any; // cleanest way to handler undefined properties -} - -export interface VerboseFrozenNode { - original: string; - normalizedInfo?: NodeNormalizerResultObj; // always supplied by Record, not required from user - qNodeID: string; - isSet: boolean; - curie: string; - UMLS: string[]; - semanticType: string[]; - semanticTypes: string[]; - label: string; - apiLabel?: string; - equivalentCuries?: string[]; // always supplied by Record, not required from user - names: string[]; - attributes: any; -} - -export interface MinimalFrozenNode { - original: string; - normalizedInfo?: NodeNormalizerResultObj; // always supplied by Record, not required from user - apiLabel?: string; - [additionalProperties: string]: any; // cleanest way to handler undefined properties -} - -export type RecordPackage = [apiEdges: any[], ...frozenRecords: FrozenRecord[]]; - -export interface MappedResponse { - trapi_sources?: TrapiSource[]; - "edge-attributes"?: EdgeAttribute[]; - [mappedItems: string]: any; -} - -export interface Association { - input_id?: string; - input_type?: string; - output_id?: string; - output_type?: string; - predicate: string; - source?: string; - api_name?: string; - "x-translator"?: any; - qualifiers?: BulkQualifiers; - apiIsPrimaryKnowledgeSource?: boolean; - [additionalProperties: string]: any; -} - -export interface QEdge { - getInputNode(): QNode; - getOutputNode(): QNode; - getHashedEdgeRepresentation(): string; - isReversed(): boolean; - [additionalProperties: string]: any; -} - -export interface QNode { - getID(): string; - isSet(): boolean; - [additionalProperties: string]: any; -} - -export interface EdgeAttribute { - attribute_source: string; - attribute_type_id: string; - value: any; - value_type_id: string; - attributes?: EdgeAttribute[]; - [additionalProperties: string]: any; -} - -export interface Identifier { - identifier: string; - label?: string; -} - -export interface NodeNormalizerResultObj { - primaryID: string; - equivalentIDs: string[]; - label: string; - labelAliases: string[]; - primaryTypes: string[]; - semanticTypes: string[]; - attributes: { - [attributeID: string]: any; - }; -} - -export interface BulkQualifiers { - [qualifierTypeID: string]: string | string[]; // qualifierValue -} diff --git a/src/transformers/biothings_transformer.ts b/src/transformers/biothings_transformer.ts index 8676dbc..cd09045 100644 --- a/src/transformers/biothings_transformer.ts +++ b/src/transformers/biothings_transformer.ts @@ -8,7 +8,7 @@ export default class BioThingsTransformer extends BaseTransformer { const mapper = item => { // for input not found, BioThings API returns an entry with a key "notfound" equal to true if (!("notfound" in item)) { - let input = generateCurie(this.edge.association.input_id, item.query); + let input = generateCurie(this.edge.association.input_id as string, item.query); if (input in res) { res[input].push(item); } else { diff --git a/src/transformers/transformer.ts b/src/transformers/transformer.ts index 02f1df3..be0e12f 100644 --- a/src/transformers/transformer.ts +++ b/src/transformers/transformer.ts @@ -2,8 +2,7 @@ import { transform } from "../json_transform/index"; import { JSONDoc } from "../json_transform/types"; import { generateCurie, toArray } from "../utils"; import { BTEKGOperationObject, BTEQueryObject } from "../types"; -import { Record } from "../record"; -import { FrozenRecord } from "../record"; +import { Record } from "@biothings-explorer/types"; import * as _ from "lodash"; import Debug from "debug"; import async from "async"; @@ -25,7 +24,7 @@ export default class BaseTransformer { */ async pairCurieWithAPIResponse() { const input = generateCurie( - this.edge.association.input_id, + this.edge.association.input_id as string, this.edge.input.hasOwnProperty("queryInputs") ? this.edge.input["queryInputs"] : (this.edge.input as string), @@ -228,7 +227,7 @@ export default class BaseTransformer { _removeNonEdgeData(mappedResponse: any) { delete mappedResponse["@type"]; - delete mappedResponse[this.edge.association.output_id]; + delete mappedResponse[this.edge.association.output_id as string]; delete mappedResponse["input_name"]; delete mappedResponse["output_name"]; return mappedResponse; @@ -330,7 +329,7 @@ export default class BaseTransformer { * @param {Object} mappedResponse - JSON response representing an output. */ extractObjectIDs(mappedResponse: object) { - const output_id_type = this.edge.association.output_id; + const output_id_type = this.edge.association.output_id as string; if (!(output_id_type in mappedResponse)) { return []; } diff --git a/src/transformers/trapi_transformer.ts b/src/transformers/trapi_transformer.ts index 0eb5dee..8d8f128 100644 --- a/src/transformers/trapi_transformer.ts +++ b/src/transformers/trapi_transformer.ts @@ -1,5 +1,5 @@ import BaseTransformer from "./transformer"; -import { Record } from "../record"; +import { Record } from "@biothings-explorer/types"; import { JSONDoc } from "../json_transform/types"; import { removeBioLinkPrefix } from "@biothings-explorer/utils"; diff --git a/src/types.ts b/src/types.ts index 6c24101..ce0427f 100644 --- a/src/types.ts +++ b/src/types.ts @@ -1,48 +1,5 @@ import { JSONDoc } from "./json_transform/types"; - -interface KGAssociationObject { - input_id?: string; - input_type: string; - output_id?: string; - output_type: string; - predicate: string; - source?: string; - api_name?: string; -} - -interface XBTEParametersObject { - [key: string]: string | number; -} - -interface TransformerObject { - wrap?: string; - pair?: string; -} - -interface TransformerSet { - [transformerPattern: string]: TransformerObject; -} - -interface QueryOperationInterface { - path: string; - method: string; - server: string; - tags: string[]; - path_params: string[]; - params: XBTEParametersObject; - request_body: object; - supportBatch: boolean; - inputSeparator: string; - transformer: TransformerSet; -} - -interface SmartAPIKGOperationObject { - association: KGAssociationObject; - query_operation?: QueryOperationInterface; - response_mapping?: any; - id?: string; - tags?: string[]; -} +import { SmartAPIKGOperationObject } from "@biothings-explorer/smartapi-kg"; interface TemplatedInput { queryInputs: string | string[];