From 5b9ce11fdccc73cd7ba0967a8f302cef3c10f3b3 Mon Sep 17 00:00:00 2001 From: Erik Spears Date: Wed, 16 Oct 2024 14:03:31 -0400 Subject: [PATCH] updates to our default BigQuery SearchProvider --- SearchProviders/company_data_bigquery.json | 31 ++++++++++++++++++++++ SearchProviders/funding_db_bigquery.json | 22 --------------- SearchProviders/preloaded.json | 18 ++++++++----- 3 files changed, 43 insertions(+), 28 deletions(-) create mode 100644 SearchProviders/company_data_bigquery.json delete mode 100644 SearchProviders/funding_db_bigquery.json diff --git a/SearchProviders/company_data_bigquery.json b/SearchProviders/company_data_bigquery.json new file mode 100644 index 000000000..9a8f5a96d --- /dev/null +++ b/SearchProviders/company_data_bigquery.json @@ -0,0 +1,31 @@ +{ + "name": "Company Data - BigQuery", + "active": false, + "default": false, + "connector": "BigQuery", + "url": "", + "query_template": "select {fields} from `{table}` where search({field1}, '{query_string}') or search({field2}, '{query_string}') or search({field3}, '{query_string}');", + "query_template_json": {}, + "post_query_template": {}, + "http_request_headers": {}, + "page_fetch_config_json": {}, + "query_processors": [ + "AdaptiveQueryProcessor" + ], + "query_mappings": "fields=*,sort_by_date=year_founded,table=company_dataset.company,field1=name,field2=domain,field3=locality", + "result_grouping_field": "", + "result_processors": [ + "MappingResultProcessor", + "CosineRelevancyResultProcessor" + ], + "response_mappings": "", + "result_mappings": "title=name,body='{name} was founded in {year_founded} and serves the {industry} industry. The company is located in {locality} and has approximately {current_employee_estimate} employees. 
The registered domain for this organization is: {domain}',url='https://www.{linkedin_url}',NO_PAYLOAD", + "results_per_query": 10, + "credentials": "/path/to/bigquery/token.json", + "eval_credentials": "", + "tags": [ + "Company", + "BigQuery", + "Internal" + ] +} diff --git a/SearchProviders/funding_db_bigquery.json b/SearchProviders/funding_db_bigquery.json deleted file mode 100644 index 769107056..000000000 --- a/SearchProviders/funding_db_bigquery.json +++ /dev/null @@ -1,22 +0,0 @@ -{ - "name": "Company Funding Records - BigQuery", - "active": false, - "default": false, - "connector": "BigQuery", - "query_template": "select {fields} from `{table}` where search({field1}, '{query_string}') or search({field2}, '{query_string}');", - "query_processors": [ - "AdaptiveQueryProcessor" - ], - "query_mappings": "fields=*,sort_by_date=fundedDate,table=funding.funding,field1=company,field2=city", - "result_processors": [ - "MappingResultProcessor", - "CosineRelevancyResultProcessor" - ], - "result_mappings": "title='{company}',body='{company} raised ${raisedamt} series {round} on {fundeddate}. The company is located in {city} {state} and has {numemps} employees.',url=id,date_published=fundeddate,NO_PAYLOAD", - "credentials": "/path/to/bigquery/token.json", - "tags": [ - "Company", - "BigQuery", - "Internal" - ] -} diff --git a/SearchProviders/preloaded.json b/SearchProviders/preloaded.json index 694d9ef8e..8521876ff 100644 --- a/SearchProviders/preloaded.json +++ b/SearchProviders/preloaded.json @@ -326,28 +326,34 @@ ] }, { - "name": "Company Funding Records - BigQuery", + "name": "Company Data - BigQuery", + "description": "Searches info on 7 million companies worldwide including LinkedIn URL, company size, location, and number of employees. Search only with company name, domain or location. Supports many languages. 
Does not support NOT operator.", "active": false, "default": false, "connector": "BigQuery", "url": "", - "query_template": "select {fields} from `{table}` where search({field1}, '{query_string}') or search({field2}, '{query_string}');", + "query_template": "select {fields} from `{table}` where search({field1}, '{query_string}') or search({field2}, '{query_string}') or search({field3}, '{query_string}');", + "query_template_json": {}, + "post_query_template": {}, + "http_request_headers": {}, + "page_fetch_config_json": {}, "query_processors": [ "AdaptiveQueryProcessor" ], - "query_mappings": "fields=*,sort_by_date=fundedDate,table=funding.funding,field1=company,field2=city", + "query_mappings": "fields=*,sort_by_date=year_founded,table=company_dataset.company,field1=name,field2=domain,field3=locality", + "result_grouping_field": "", "result_processors": [ "MappingResultProcessor", "CosineRelevancyResultProcessor" ], "response_mappings": "", - "result_mappings": "title='{company}',body='{company} raised ${raisedamt} series {round} on {fundeddate}. The company is located in {city} {state} and has {numemps} employees.',url=id,date_published=fundeddate,NO_PAYLOAD", + "result_mappings": "title=name,body='{name} was founded in {year_founded} and serves the {industry} industry. The company is located in {locality} and has approximately {current_employee_estimate} employees. The registered domain for this organization is: {domain}',url='https://www.{linkedin_url}',NO_PAYLOAD", "results_per_query": 10, "credentials": "/path/to/bigquery/token.json", + "eval_credentials": "", "tags": [ "Company", - "BigQuery", - "Internal" + "BigQuery" ] }, {