Skip to content

Commit

Permalink
Set User-Agent in http request (opensearch-project#300)
Browse files Browse the repository at this point in the history
Signed-off-by: Heemin Kim <[email protected]>
  • Loading branch information
heemin32 committed Jul 21, 2023
1 parent 235431e commit 062d73b
Show file tree
Hide file tree
Showing 10 changed files with 128 additions and 31 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,7 @@
import java.io.IOException;
import java.io.InputStreamReader;
import java.net.URL;
import java.net.URLConnection;
import java.nio.CharBuffer;
import java.security.AccessController;
import java.security.PrivilegedAction;
Expand All @@ -25,6 +26,8 @@
import org.opensearch.core.xcontent.DeprecationHandler;
import org.opensearch.core.xcontent.NamedXContentRegistry;
import org.opensearch.core.xcontent.XContentParser;
import org.opensearch.geospatial.annotation.VisibleForTesting;
import org.opensearch.geospatial.shared.Constants;

/**
* Ip2Geo datasource manifest file object
Expand All @@ -39,7 +42,7 @@ public class DatasourceManifest {
private static final ParseField DB_NAME_FIELD = new ParseField("db_name");
private static final ParseField SHA256_HASH_FIELD = new ParseField("sha256_hash");
private static final ParseField VALID_FOR_IN_DAYS_FIELD = new ParseField("valid_for_in_days");
private static final ParseField UPDATED_AT_FIELD = new ParseField("updated_at");
private static final ParseField UPDATED_AT_FIELD = new ParseField("updated_at_in_epoch_milli");
private static final ParseField PROVIDER_FIELD = new ParseField("provider");

/**
Expand Down Expand Up @@ -114,20 +117,31 @@ public static class Builder {
public static DatasourceManifest build(final URL url) {
SpecialPermission.check();
return AccessController.doPrivileged((PrivilegedAction<DatasourceManifest>) () -> {
try (BufferedReader reader = new BufferedReader(new InputStreamReader(url.openStream()))) {
CharBuffer charBuffer = CharBuffer.allocate(MANIFEST_FILE_MAX_BYTES);
reader.read(charBuffer);
charBuffer.flip();
XContentParser parser = JsonXContent.jsonXContent.createParser(
NamedXContentRegistry.EMPTY,
DeprecationHandler.IGNORE_DEPRECATIONS,
charBuffer.toString()
);
return PARSER.parse(parser, null);
try {
URLConnection connection = url.openConnection();
return internalBuild(connection);
} catch (IOException e) {
throw new RuntimeException(e);
}
});
}

@VisibleForTesting
@SuppressForbidden(reason = "Need to connect to http endpoint to read manifest file")
protected static DatasourceManifest internalBuild(final URLConnection connection) throws IOException {
connection.addRequestProperty(Constants.USER_AGENT_KEY, Constants.USER_AGENT_VALUE);
InputStreamReader inputStreamReader = new InputStreamReader(connection.getInputStream());
try (BufferedReader reader = new BufferedReader(inputStreamReader)) {
CharBuffer charBuffer = CharBuffer.allocate(MANIFEST_FILE_MAX_BYTES);
reader.read(charBuffer);
charBuffer.flip();
XContentParser parser = JsonXContent.jsonXContent.createParser(
NamedXContentRegistry.EMPTY,
DeprecationHandler.IGNORE_DEPRECATIONS,
charBuffer.toString()
);
return PARSER.parse(parser, null);
}
}
}
}
Original file line number Diff line number Diff line change
Expand Up @@ -12,6 +12,7 @@
import java.io.InputStream;
import java.io.InputStreamReader;
import java.net.URL;
import java.net.URLConnection;
import java.nio.charset.StandardCharsets;
import java.security.AccessController;
import java.security.PrivilegedAction;
Expand Down Expand Up @@ -53,6 +54,8 @@
import org.opensearch.common.unit.TimeValue;
import org.opensearch.common.xcontent.XContentHelper;
import org.opensearch.common.xcontent.XContentType;
import org.opensearch.geospatial.annotation.VisibleForTesting;
import org.opensearch.geospatial.shared.Constants;
import org.opensearch.geospatial.shared.StashedThreadContext;
import org.opensearch.index.query.QueryBuilders;

Expand Down Expand Up @@ -139,26 +142,29 @@ public CSVParser getDatabaseReader(final DatasourceManifest manifest) {
return AccessController.doPrivileged((PrivilegedAction<CSVParser>) () -> {
try {
URL zipUrl = new URL(manifest.getUrl());
ZipInputStream zipIn = new ZipInputStream(zipUrl.openStream());
ZipEntry zipEntry = zipIn.getNextEntry();
while (zipEntry != null) {
if (zipEntry.getName().equalsIgnoreCase(manifest.getDbName()) == false) {
zipEntry = zipIn.getNextEntry();
continue;
}
return new CSVParser(new BufferedReader(new InputStreamReader(zipIn)), CSVFormat.RFC4180);
}
return internalGetDatabaseReader(manifest, zipUrl.openConnection());
} catch (IOException e) {
throw new OpenSearchException("failed to read geoip data from {}", manifest.getUrl(), e);
}
throw new OpenSearchException(
"database file [{}] does not exist in the zip file [{}]",
manifest.getDbName(),
manifest.getUrl()
);
});
}

@VisibleForTesting
@SuppressForbidden(reason = "Need to connect to http endpoint to read GeoIP database file")
protected CSVParser internalGetDatabaseReader(final DatasourceManifest manifest, final URLConnection connection) throws IOException {
connection.addRequestProperty(Constants.USER_AGENT_KEY, Constants.USER_AGENT_VALUE);
ZipInputStream zipIn = new ZipInputStream(connection.getInputStream());
ZipEntry zipEntry = zipIn.getNextEntry();
while (zipEntry != null) {
if (zipEntry.getName().equalsIgnoreCase(manifest.getDbName()) == false) {
zipEntry = zipIn.getNextEntry();
continue;
}
return new CSVParser(new BufferedReader(new InputStreamReader(zipIn)), CSVFormat.RFC4180);
}
throw new OpenSearchException("database file [{}] does not exist in the zip file [{}]", manifest.getDbName(), manifest.getUrl());
}

/**
* Create a document in json string format to ingest in datasource database index
*
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -23,8 +23,7 @@ public class Ip2GeoSettings {
*/
public static final Setting<String> DATASOURCE_ENDPOINT = Setting.simpleString(
"plugins.geospatial.ip2geo.datasource.endpoint",
// TODO: This value is not correct. Update it later once CDN server is ready.
"https://geoip.maps.opensearch.org/v1/geolite-2/manifest.json",
"https://geoip.maps.opensearch.org/v1/geolite2-city/manifest.json",
new DatasourceEndpointValidator(),
Setting.Property.NodeScope,
Setting.Property.Dynamic
Expand Down
15 changes: 15 additions & 0 deletions src/main/java/org/opensearch/geospatial/shared/Constants.java
Original file line number Diff line number Diff line change
@@ -0,0 +1,15 @@
/*
* Copyright OpenSearch Contributors
* SPDX-License-Identifier: Apache-2.0
*/

package org.opensearch.geospatial.shared;

import java.util.Locale;

import org.opensearch.Version;

public class Constants {
public static final String USER_AGENT_KEY = "User-Agent";
public static final String USER_AGENT_VALUE = String.format(Locale.ROOT, "OpenSearch/%s vanilla", Version.CURRENT.toString());
}
Original file line number Diff line number Diff line change
Expand Up @@ -69,7 +69,7 @@ public void testPrepareRequestDefaultValue() {
verifyingClient.setExecuteLocallyVerifier((actionResponse, actionRequest) -> {
assertTrue(actionRequest instanceof PutDatasourceRequest);
PutDatasourceRequest putDatasourceRequest = (PutDatasourceRequest) actionRequest;
assertEquals("https://geoip.maps.opensearch.org/v1/geolite-2/manifest.json", putDatasourceRequest.getEndpoint());
assertEquals("https://geoip.maps.opensearch.org/v1/geolite2-city/manifest.json", putDatasourceRequest.getEndpoint());
assertEquals(TimeValue.timeValueDays(3), putDatasourceRequest.getUpdateInterval());
assertEquals(datasourceName, putDatasourceRequest.getName());
isExecuted.set(true);
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,38 @@
/*
* Copyright OpenSearch Contributors
* SPDX-License-Identifier: Apache-2.0
*/

package org.opensearch.geospatial.ip2geo.common;

import static org.mockito.Mockito.mock;
import static org.mockito.Mockito.verify;
import static org.mockito.Mockito.when;

import java.io.File;
import java.io.FileInputStream;
import java.net.URLConnection;

import lombok.SneakyThrows;

import org.opensearch.common.SuppressForbidden;
import org.opensearch.geospatial.ip2geo.Ip2GeoTestCase;
import org.opensearch.geospatial.shared.Constants;

@SuppressForbidden(reason = "unit test")
public class DatasourceManifestTests extends Ip2GeoTestCase {

@SneakyThrows
public void testInternalBuild_whenCalled_thenCorrectUserAgentValueIsSet() {
URLConnection connection = mock(URLConnection.class);
File manifestFile = new File(this.getClass().getClassLoader().getResource("ip2geo/manifest.json").getFile());
when(connection.getInputStream()).thenReturn(new FileInputStream(manifestFile));

// Run
DatasourceManifest manifest = DatasourceManifest.Builder.internalBuild(connection);

// Verify
verify(connection).addRequestProperty(Constants.USER_AGENT_KEY, Constants.USER_AGENT_VALUE);
assertEquals("https://test.com/db.zip", manifest.getUrl());
}
}
Original file line number Diff line number Diff line change
Expand Up @@ -14,6 +14,8 @@
import static org.opensearch.geospatial.ip2geo.jobscheduler.Datasource.IP2GEO_DATA_INDEX_NAME_PREFIX;

import java.io.File;
import java.io.FileInputStream;
import java.net.URLConnection;
import java.nio.ByteBuffer;
import java.nio.charset.StandardCharsets;
import java.time.Instant;
Expand Down Expand Up @@ -55,6 +57,7 @@
import org.opensearch.common.bytes.BytesReference;
import org.opensearch.geospatial.GeospatialTestHelper;
import org.opensearch.geospatial.ip2geo.Ip2GeoTestCase;
import org.opensearch.geospatial.shared.Constants;
import org.opensearch.index.query.QueryBuilders;
import org.opensearch.search.SearchHit;
import org.opensearch.search.SearchHits;
Expand Down Expand Up @@ -139,6 +142,28 @@ public void testGetDatabaseReaderNoFile() throws Exception {
assertTrue(exception.getMessage().contains("does not exist"));
}

@SneakyThrows
public void testInternalGetDatabaseReader_whenCalled_thenSetUserAgent() {
File zipFile = new File(this.getClass().getClassLoader().getResource("ip2geo/sample_valid.zip").getFile());
DatasourceManifest manifest = new DatasourceManifest(
zipFile.toURI().toURL().toExternalForm(),
"sample_valid.csv",
"fake_sha256",
1l,
Instant.now().toEpochMilli(),
"tester"
);

URLConnection connection = mock(URLConnection.class);
when(connection.getInputStream()).thenReturn(new FileInputStream(zipFile));

// Run
noOpsGeoIpDataFacade.internalGetDatabaseReader(manifest, connection);

// Verify
verify(connection).addRequestProperty(Constants.USER_AGENT_KEY, Constants.USER_AGENT_VALUE);
}

public void testDeleteIp2GeoDataIndex() {
String index = String.format(Locale.ROOT, "%s.%s", IP2GEO_DATA_INDEX_NAME_PREFIX, GeospatialTestHelper.randomLowerCaseString());
verifyingClient.setExecuteVerifier((actionResponse, actionRequest) -> {
Expand Down
2 changes: 1 addition & 1 deletion src/test/resources/ip2geo/manifest.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,6 @@
"db_name": "sample_valid.csv",
"sha256_hash": "safasdfaskkkesadfasdf",
"valid_for_in_days": 30,
"updated_at": 3134012341236,
"updated_at_in_epoch_milli": 3134012341236,
"provider": "sample_provider"
}
2 changes: 1 addition & 1 deletion src/test/resources/ip2geo/manifest_invalid_url.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,6 @@
"db_name": "sample_valid.csv",
"sha256_hash": "safasdfaskkkesadfasdf",
"valid_for_in_days": 30,
"updated_at": 3134012341236,
"updated_at_in_epoch_milli": 3134012341236,
"provider": "sample_provider"
}
2 changes: 1 addition & 1 deletion src/test/resources/ip2geo/manifest_template.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,6 @@
"db_name": "sample_valid.csv",
"sha256_hash": "safasdfaskkkesadfasdf",
"valid_for_in_days": 30,
"updated_at": 3134012341236,
"updated_at_in_epoch_milli": 3134012341236,
"provider": "maxmind"
}

0 comments on commit 062d73b

Please sign in to comment.