forked from elastic/elasticsearch
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
GeoIP database downloader (elastic#68424)
This change adds component that will download new GeoIP databases from infra service New databases are downloaded in chunks and stored in .geoip_databases index Downloads are verified against MD5 checksum provided by the server Current state of all stored databases is stored in cluster state in persistent task state Relates to elastic#68920 # Conflicts: # modules/ingest-geoip/src/main/java/org/elasticsearch/ingest/geoip/IngestGeoIpPlugin.java
- Loading branch information
1 parent
132c4f8
commit cc949b1
Showing
20 changed files
with
1,650 additions
and
62 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
63 changes: 63 additions & 0 deletions
63
...st-geoip/src/internalClusterTest/java/org/elasticsearch/ingest/geoip/AbstractGeoIpIT.java
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,63 @@ | ||
/* | ||
* Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one | ||
* or more contributor license agreements. Licensed under the Elastic License | ||
* 2.0 and the Server Side Public License, v 1; you may not use this file except | ||
* in compliance with, at your election, the Elastic License 2.0 or the Server | ||
* Side Public License, v 1. | ||
*/ | ||
|
||
package org.elasticsearch.ingest.geoip; | ||
|
||
import org.elasticsearch.common.settings.Setting; | ||
import org.elasticsearch.common.settings.Settings; | ||
import org.elasticsearch.plugins.Plugin; | ||
import org.elasticsearch.test.ESIntegTestCase; | ||
import org.elasticsearch.test.StreamsUtils; | ||
|
||
import java.io.ByteArrayInputStream; | ||
import java.io.IOException; | ||
import java.io.UncheckedIOException; | ||
import java.nio.file.Files; | ||
import java.nio.file.Path; | ||
import java.util.Arrays; | ||
import java.util.Collection; | ||
import java.util.Collections; | ||
import java.util.List; | ||
|
||
public abstract class AbstractGeoIpIT extends ESIntegTestCase { | ||
@Override | ||
protected Collection<Class<? extends Plugin>> nodePlugins() { | ||
return Arrays.asList(IngestGeoIpPlugin.class, IngestGeoIpSettingsPlugin.class); | ||
} | ||
|
||
@Override | ||
protected Settings nodeSettings(final int nodeOrdinal) { | ||
final Path databasePath = createTempDir(); | ||
try { | ||
Files.createDirectories(databasePath); | ||
Files.copy( | ||
new ByteArrayInputStream(StreamsUtils.copyToBytesFromClasspath("/GeoLite2-City.mmdb")), | ||
databasePath.resolve("GeoLite2-City.mmdb")); | ||
Files.copy( | ||
new ByteArrayInputStream(StreamsUtils.copyToBytesFromClasspath("/GeoLite2-Country.mmdb")), | ||
databasePath.resolve("GeoLite2-Country.mmdb")); | ||
Files.copy( | ||
new ByteArrayInputStream(StreamsUtils.copyToBytesFromClasspath("/GeoLite2-ASN.mmdb")), | ||
databasePath.resolve("GeoLite2-ASN.mmdb")); | ||
} catch (final IOException e) { | ||
throw new UncheckedIOException(e); | ||
} | ||
return Settings.builder() | ||
.put("ingest.geoip.database_path", databasePath) | ||
.put(super.nodeSettings(nodeOrdinal)) | ||
.build(); | ||
} | ||
|
||
public static class IngestGeoIpSettingsPlugin extends Plugin { | ||
|
||
@Override | ||
public List<Setting<?>> getSettings() { | ||
return Collections.singletonList(Setting.simpleString("ingest.geoip.database_path", Setting.Property.NodeScope)); | ||
} | ||
} | ||
} |
174 changes: 174 additions & 0 deletions
174
...-geoip/src/internalClusterTest/java/org/elasticsearch/ingest/geoip/GeoIpDownloaderIT.java
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,174 @@ | ||
/* | ||
* Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one | ||
* or more contributor license agreements. Licensed under the Elastic License | ||
* 2.0 and the Server Side Public License, v 1; you may not use this file except | ||
* in compliance with, at your election, the Elastic License 2.0 or the Server | ||
* Side Public License, v 1. | ||
*/ | ||
|
||
package org.elasticsearch.ingest.geoip; | ||
|
||
import com.maxmind.geoip2.DatabaseReader; | ||
import org.apache.lucene.search.TotalHits; | ||
import org.elasticsearch.action.admin.cluster.settings.ClusterUpdateSettingsResponse; | ||
import org.elasticsearch.action.search.SearchResponse; | ||
import org.elasticsearch.common.SuppressForbidden; | ||
import org.elasticsearch.common.settings.Settings; | ||
import org.elasticsearch.index.query.BoolQueryBuilder; | ||
import org.elasticsearch.index.query.MatchQueryBuilder; | ||
import org.elasticsearch.index.query.RangeQueryBuilder; | ||
import org.elasticsearch.index.reindex.ReindexPlugin; | ||
import org.elasticsearch.persistent.PersistentTaskParams; | ||
import org.elasticsearch.persistent.PersistentTasksCustomMetadata; | ||
import org.elasticsearch.plugins.Plugin; | ||
import org.elasticsearch.search.SearchHit; | ||
import org.elasticsearch.search.sort.SortOrder; | ||
import org.elasticsearch.test.ESIntegTestCase.ClusterScope; | ||
import org.elasticsearch.test.ESIntegTestCase.Scope; | ||
|
||
import java.io.BufferedOutputStream; | ||
import java.io.ByteArrayInputStream; | ||
import java.io.IOException; | ||
import java.io.InputStream; | ||
import java.io.OutputStream; | ||
import java.nio.file.Files; | ||
import java.nio.file.Path; | ||
import java.util.ArrayList; | ||
import java.util.Arrays; | ||
import java.util.Collection; | ||
import java.util.Iterator; | ||
import java.util.List; | ||
import java.util.Set; | ||
import java.util.concurrent.TimeUnit; | ||
import java.util.zip.GZIPInputStream; | ||
|
||
import static java.nio.file.StandardOpenOption.CREATE; | ||
import static java.nio.file.StandardOpenOption.TRUNCATE_EXISTING; | ||
import static java.nio.file.StandardOpenOption.WRITE; | ||
|
||
@ClusterScope(scope = Scope.TEST, maxNumDataNodes = 1) | ||
public class GeoIpDownloaderIT extends AbstractGeoIpIT { | ||
|
||
@Override | ||
protected Collection<Class<? extends Plugin>> nodePlugins() { | ||
return Arrays.asList(ReindexPlugin.class, IngestGeoIpPlugin.class, GeoIpProcessorNonIngestNodeIT.IngestGeoIpSettingsPlugin.class); | ||
} | ||
|
||
@Override | ||
protected Settings nodeSettings(int nodeOrdinal) { | ||
Settings.Builder settings = Settings.builder() | ||
.put(super.nodeSettings(nodeOrdinal)) | ||
.put(GeoIpDownloaderTaskExecutor.ENABLED_SETTING.getKey(), false); | ||
String endpoint = System.getProperty("geoip_endpoint"); | ||
if (endpoint != null) { | ||
settings.put(GeoIpDownloader.ENDPOINT_SETTING.getKey(), endpoint); | ||
} | ||
return settings.build(); | ||
} | ||
|
||
public void testGeoIpDatabasesDownload() throws Exception { | ||
ClusterUpdateSettingsResponse settingsResponse = client().admin().cluster() | ||
.prepareUpdateSettings() | ||
.setPersistentSettings(Settings.builder().put(GeoIpDownloaderTaskExecutor.ENABLED_SETTING.getKey(), true)) | ||
.get(); | ||
assertTrue(settingsResponse.isAcknowledged()); | ||
assertBusy(() -> { | ||
PersistentTasksCustomMetadata.PersistentTask<PersistentTaskParams> task = getTask(); | ||
assertNotNull(task); | ||
GeoIpTaskState state = (GeoIpTaskState) task.getState(); | ||
assertNotNull(state); | ||
assertEquals(Set.of("GeoLite2-ASN.mmdb", "GeoLite2-City.mmdb", "GeoLite2-Country.mmdb"), state.getDatabases().keySet()); | ||
}, 2, TimeUnit.MINUTES); | ||
|
||
GeoIpTaskState state = (GeoIpTaskState) getTask().getState(); | ||
for (String id : List.of("GeoLite2-ASN.mmdb", "GeoLite2-City.mmdb", "GeoLite2-Country.mmdb")) { | ||
assertBusy(() -> { | ||
GeoIpTaskState.Metadata metadata = state.get(id); | ||
BoolQueryBuilder queryBuilder = new BoolQueryBuilder() | ||
.filter(new MatchQueryBuilder("name", id)) | ||
.filter(new RangeQueryBuilder("chunk") | ||
.from(metadata.getFirstChunk()) | ||
.to(metadata.getLastChunk(), true)); | ||
int size = metadata.getLastChunk() - metadata.getFirstChunk() + 1; | ||
SearchResponse res = client().prepareSearch(GeoIpDownloader.DATABASES_INDEX) | ||
.setSize(size) | ||
.setQuery(queryBuilder) | ||
.addSort("chunk", SortOrder.ASC) | ||
.get(); | ||
TotalHits totalHits = res.getHits().getTotalHits(); | ||
assertEquals(TotalHits.Relation.EQUAL_TO, totalHits.relation); | ||
assertEquals(size, totalHits.value); | ||
assertEquals(size, res.getHits().getHits().length); | ||
|
||
List<byte[]> data = new ArrayList<>(); | ||
|
||
for (SearchHit hit : res.getHits().getHits()) { | ||
data.add((byte[]) hit.getSourceAsMap().get("data")); | ||
} | ||
|
||
GZIPInputStream stream = new GZIPInputStream(new MultiByteArrayInputStream(data)); | ||
Path tempFile = createTempFile(); | ||
try (OutputStream os = new BufferedOutputStream(Files.newOutputStream(tempFile, TRUNCATE_EXISTING, WRITE, CREATE))) { | ||
stream.transferTo(os); | ||
} | ||
|
||
parseDatabase(tempFile); | ||
}); | ||
} | ||
} | ||
|
||
@SuppressForbidden(reason = "Maxmind API requires java.io.File") | ||
private void parseDatabase(Path tempFile) throws IOException { | ||
try (DatabaseReader databaseReader = new DatabaseReader.Builder(tempFile.toFile()).build()) { | ||
assertNotNull(databaseReader.getMetadata()); | ||
} | ||
} | ||
|
||
private PersistentTasksCustomMetadata.PersistentTask<PersistentTaskParams> getTask() { | ||
return PersistentTasksCustomMetadata.getTaskWithId(clusterService().state(), GeoIpDownloader.GEOIP_DOWNLOADER); | ||
} | ||
|
||
private static class MultiByteArrayInputStream extends InputStream { | ||
|
||
private final Iterator<byte[]> data; | ||
private ByteArrayInputStream current; | ||
|
||
private MultiByteArrayInputStream(List<byte[]> data) { | ||
this.data = data.iterator(); | ||
} | ||
|
||
@Override | ||
public int read() { | ||
if (current == null) { | ||
if (data.hasNext() == false) { | ||
return -1; | ||
} | ||
|
||
current = new ByteArrayInputStream(data.next()); | ||
} | ||
int read = current.read(); | ||
if (read == -1) { | ||
current = null; | ||
return read(); | ||
} | ||
return read; | ||
} | ||
|
||
@Override | ||
public int read(byte[] b, int off, int len) throws IOException { | ||
if (current == null) { | ||
if (data.hasNext() == false) { | ||
return -1; | ||
} | ||
|
||
current = new ByteArrayInputStream(data.next()); | ||
} | ||
int read = current.read(b, off, len); | ||
if (read == -1) { | ||
current = null; | ||
return read(b, off, len); | ||
} | ||
return read; | ||
} | ||
} | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.