-
Notifications
You must be signed in to change notification settings - Fork 5
/
meltano.yml
85 lines (85 loc) · 2.86 KB
/
meltano.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
# Meltano project file used to develop and exercise tap-mongodb locally.
# The extractor is installed in editable mode from this directory
# (`pip_url: -e .`) and paired with a JSONL loader.
version: 1
send_anonymous_usage_stats: true
project_id: "tap-mongodb"
default_environment: dev

environments:
  - name: dev

plugins:
  extractors:
    - name: "tap-mongodb"
      namespace: "tap_mongodb"
      pip_url: -e .
      capabilities:
        - batch
        - state
        - catalog
        - discover
        - about
        - stream-maps
        - test
      # Settings the tap exposes; `value` is the default applied when the
      # setting is not overridden under `config` below.
      settings:
        - name: stream_prefix
          description: >-
            Optionally add a prefix for all streams, useful if ingesting
            from multiple shards/clusters via independent tap-mongodb configs.
          value: ""
        - name: optional_replication_key
          description: |
            Make the replication key optional. If set to true, the tap will
            not fail if the replication key is not found in a document.
          value: false
        - name: database_includes
          description: |
            A list of databases to include. If this is set,
            only the databases in this list will be replicated.
          value: []
        - name: database_excludes
          description: |
            A list of databases to exclude. If this is set,
            all databases except those in this list will be replicated.
          value: []
        - name: infer_schema
          description: |
            If set to true, the tap will infer the schema from a sample of the
            documents in each collection. If set to false, the tap will
            use a default schema for each collection.
          value: false
        - name: infer_schema_max_docs
          description: |
            The maximum number of documents to use when inferring the schema.
          value: 2000
        - name: mongo
          description: >-
            These props are passed directly to pymongo MongoClient allowing the
            tap user full flexibility not provided in any other Mongo tap.
        - name: mongo_file_location
          description: >-
            Optional path to a YAML file containing the mongo configuration
            properties.
      config:
        # All streams will be prefixed with `example_`
        stream_prefix: example_
        # These are all passed directly through to pymongo MongoClient, ie:
        mongo:
          host: localhost
          port: 27017
          directConnection: true
          readPreference: secondaryPreferred
          # NOTE(review): these look like example credentials for a local
          # MongoDB instance. Do not commit real secrets here; prefer
          # environment variables or a file referenced by `mongo_file_location`.
          username: mongodb
          password: mongodb
          authSource: admin
          authMechanism: SCRAM-SHA-1
          tls: true
      # Select every property of every discovered stream.
      select:
        - "*.*"
      metadata:
        # Example of how to set a replication key for a collection
        # <stream_prefix><db_name>_<collection_name>
        example_mydb_mycollection:
          replication-key: lastUpdatedAt
        example_mydb_myothercollection:
          replication-key: lastUpdatedAt
  loaders:
    - name: target-jsonl
      variant: andyh1203
      pip_url: target-jsonl