Search in sources :

Example 1 with SingularityS3SearchRequest

use of com.hubspot.singularity.api.SingularityS3SearchRequest in project Singularity by HubSpot.

the class S3LogResource method getS3LogsWithExecutorService.

// Fetching logs
private List<SingularityS3LogMetadata> getS3LogsWithExecutorService(S3Configuration s3Configuration, ListeningExecutorService executorService, Map<SingularityS3Service, Set<String>> servicesToPrefixes, int totalPrefixCount, final SingularityS3SearchRequest search, final ConcurrentHashMap<String, ContinuationToken> continuationTokens, final boolean paginated) throws InterruptedException, ExecutionException, TimeoutException {
    List<ListenableFuture<List<S3ObjectSummaryHolder>>> futures = Lists.newArrayListWithCapacity(totalPrefixCount);
    final AtomicInteger resultCount = new AtomicInteger();
    for (final Map.Entry<SingularityS3Service, Set<String>> entry : servicesToPrefixes.entrySet()) {
        final String s3Bucket = entry.getKey().getBucket();
        final String group = entry.getKey().getGroup();
        final AmazonS3 s3Client = entry.getKey().getS3Client();
        for (final String s3Prefix : entry.getValue()) {
            final String key = String.format(CONTINUATION_TOKEN_KEY_FORMAT, group, s3Bucket, s3Prefix);
            if (search.getContinuationTokens().containsKey(key) && search.getContinuationTokens().get(key).isLastPage()) {
                LOG.trace("No further content for prefix {} in bucket {}, skipping", s3Prefix, s3Bucket);
                continuationTokens.putIfAbsent(key, search.getContinuationTokens().get(key));
                continue;
            }
            futures.add(executorService.submit(new Callable<List<S3ObjectSummaryHolder>>() {

                @Override
                public List<S3ObjectSummaryHolder> call() throws Exception {
                    ListObjectsV2Request request = new ListObjectsV2Request().withBucketName(s3Bucket).withPrefix(s3Prefix);
                    if (paginated) {
                        Optional<ContinuationToken> token = Optional.empty();
                        if (search.getContinuationTokens().containsKey(key) && !Strings.isNullOrEmpty(search.getContinuationTokens().get(key).getValue())) {
                            request.setContinuationToken(search.getContinuationTokens().get(key).getValue());
                            token = Optional.of(search.getContinuationTokens().get(key));
                        }
                        int targetResultCount = search.getMaxPerPage().orElse(DEFAULT_TARGET_MAX_RESULTS);
                        request.setMaxKeys(targetResultCount);
                        if (resultCount.get() < targetResultCount) {
                            ListObjectsV2Result result = s3Client.listObjectsV2(request);
                            if (result.getObjectSummaries().isEmpty()) {
                                continuationTokens.putIfAbsent(key, new ContinuationToken(result.getNextContinuationToken(), true));
                                return Collections.emptyList();
                            } else {
                                boolean addToList = incrementIfLessThan(resultCount, result.getObjectSummaries().size(), targetResultCount);
                                if (addToList) {
                                    continuationTokens.putIfAbsent(key, new ContinuationToken(result.getNextContinuationToken(), !result.isTruncated()));
                                    List<S3ObjectSummaryHolder> objectSummaryHolders = new ArrayList<>();
                                    for (S3ObjectSummary objectSummary : result.getObjectSummaries()) {
                                        if (search.getFileNamePrefixWhitelist().isEmpty() || search.getFileNamePrefixWhitelist().stream().anyMatch(whitelistedPrefix -> objectSummary.getKey().startsWith(whitelistedPrefix))) {
                                            objectSummaryHolders.add(new S3ObjectSummaryHolder(group, objectSummary));
                                        }
                                    }
                                    return objectSummaryHolders;
                                } else {
                                    continuationTokens.putIfAbsent(key, token.orElse(new ContinuationToken(null, false)));
                                    return Collections.emptyList();
                                }
                            }
                        } else {
                            continuationTokens.putIfAbsent(key, token.orElse(new ContinuationToken(null, false)));
                            return Collections.emptyList();
                        }
                    } else {
                        ListObjectsV2Result result = s3Client.listObjectsV2(request);
                        List<S3ObjectSummaryHolder> objectSummaryHolders = new ArrayList<>();
                        for (S3ObjectSummary objectSummary : result.getObjectSummaries()) {
                            if (search.getFileNamePrefixWhitelist().isEmpty() || search.getFileNamePrefixWhitelist().stream().anyMatch(whitelistedPrefix -> objectSummary.getKey().startsWith(whitelistedPrefix))) {
                                objectSummaryHolders.add(new S3ObjectSummaryHolder(group, objectSummary));
                            }
                        }
                        while (result.isTruncated() && result.getContinuationToken() != null) {
                            result = s3Client.listObjectsV2(new ListObjectsV2Request().withBucketName(s3Bucket).withPrefix(s3Prefix).withContinuationToken(result.getContinuationToken()));
                            for (S3ObjectSummary objectSummary : result.getObjectSummaries()) {
                                objectSummaryHolders.add(new S3ObjectSummaryHolder(group, objectSummary));
                            }
                        }
                        return objectSummaryHolders;
                    }
                }
            }));
        }
    }
    final long start = System.currentTimeMillis();
    List<List<S3ObjectSummaryHolder>> results = Futures.allAsList(futures).get(s3Configuration.getWaitForS3ListSeconds(), TimeUnit.SECONDS);
    List<S3ObjectSummaryHolder> objects = Lists.newArrayListWithExpectedSize(results.size() * 2);
    for (List<S3ObjectSummaryHolder> s3ObjectSummaryHolders : results) {
        for (final S3ObjectSummaryHolder s3ObjectHolder : s3ObjectSummaryHolders) {
            objects.add(s3ObjectHolder);
        }
    }
    LOG.trace("Got {} objects from S3 after {}", objects.size(), JavaUtils.duration(start));
    List<ListenableFuture<SingularityS3LogMetadata>> logFutures = Lists.newArrayListWithCapacity(objects.size());
    final Date expireAt = new Date(System.currentTimeMillis() + s3Configuration.getExpireS3LinksAfterMillis());
    for (final S3ObjectSummaryHolder s3ObjectHolder : objects) {
        final S3ObjectSummary s3Object = s3ObjectHolder.getObjectSummary();
        final AmazonS3 s3Client = s3Services.getServiceByGroupAndBucketOrDefault(s3ObjectHolder.getGroup(), s3Object.getBucketName()).getS3Client();
        logFutures.add(executorService.submit(new Callable<SingularityS3LogMetadata>() {

            @Override
            public SingularityS3LogMetadata call() throws Exception {
                Optional<Long> maybeStartTime = Optional.empty();
                Optional<Long> maybeEndTime = Optional.empty();
                if (!search.isExcludeMetadata()) {
                    GetObjectMetadataRequest metadataRequest = new GetObjectMetadataRequest(s3Object.getBucketName(), s3Object.getKey());
                    Map<String, String> objectMetadata = s3Client.getObjectMetadata(metadataRequest).getUserMetadata();
                    maybeStartTime = getMetadataAsLong(objectMetadata, SingularityS3Log.LOG_START_S3_ATTR);
                    maybeEndTime = getMetadataAsLong(objectMetadata, SingularityS3Log.LOG_END_S3_ATTR);
                }
                if (search.isListOnly()) {
                    return new SingularityS3LogMetadata(s3Object.getKey(), s3Object.getLastModified().getTime(), s3Object.getSize(), maybeStartTime, maybeEndTime);
                } else {
                    GeneratePresignedUrlRequest getUrlRequest = new GeneratePresignedUrlRequest(s3Object.getBucketName(), s3Object.getKey()).withMethod(HttpMethod.GET).withExpiration(expireAt);
                    String getUrl = s3Client.generatePresignedUrl(getUrlRequest).toString();
                    ResponseHeaderOverrides downloadHeaders = new ResponseHeaderOverrides();
                    downloadHeaders.setContentDisposition(CONTENT_DISPOSITION_DOWNLOAD_HEADER);
                    downloadHeaders.setContentEncoding(CONTENT_ENCODING_DOWNLOAD_HEADER);
                    GeneratePresignedUrlRequest downloadUrlRequest = new GeneratePresignedUrlRequest(s3Object.getBucketName(), s3Object.getKey()).withMethod(HttpMethod.GET).withExpiration(expireAt).withResponseHeaders(downloadHeaders);
                    String downloadUrl = s3Client.generatePresignedUrl(downloadUrlRequest).toString();
                    return new SingularityS3Log(getUrl, s3Object.getKey(), s3Object.getLastModified().getTime(), s3Object.getSize(), downloadUrl, maybeStartTime, maybeEndTime);
                }
            }
        }));
    }
    return Futures.allAsList(logFutures).get(s3Configuration.getWaitForS3LinksSeconds(), TimeUnit.SECONDS);
}
Also used : WebExceptions.timeout(com.hubspot.singularity.WebExceptions.timeout) DeployManager(com.hubspot.singularity.data.DeployManager) WebExceptions.checkBadRequest(com.hubspot.singularity.WebExceptions.checkBadRequest) HistoryManager(com.hubspot.singularity.data.history.HistoryManager) Tags(io.swagger.v3.oas.annotations.tags.Tags) Produces(javax.ws.rs.Produces) Date(java.util.Date) Inject(com.google.inject.Inject) RequestManager(com.hubspot.singularity.data.RequestManager) Path(javax.ws.rs.Path) LoggerFactory(org.slf4j.LoggerFactory) TimeoutException(java.util.concurrent.TimeoutException) SingularityS3SearchRequest(com.hubspot.singularity.api.SingularityS3SearchRequest) LeaderLatch(org.apache.curator.framework.recipes.leader.LeaderLatch) ListObjectsV2Request(com.amazonaws.services.s3.model.ListObjectsV2Request) RequestHistoryType(com.hubspot.singularity.SingularityRequestHistory.RequestHistoryType) MediaType(javax.ws.rs.core.MediaType) QueryParam(javax.ws.rs.QueryParam) Consumes(javax.ws.rs.Consumes) AtomicInteger(java.util.concurrent.atomic.AtomicInteger) SingularityS3SearchResult(com.hubspot.singularity.api.SingularityS3SearchResult) RequestBody(io.swagger.v3.oas.annotations.parameters.RequestBody) Map(java.util.Map) DefaultValue(javax.ws.rs.DefaultValue) ApiPaths(com.hubspot.singularity.config.ApiPaths) TaskManager(com.hubspot.singularity.data.TaskManager) HttpMethod(com.amazonaws.HttpMethod) SingularityTaskId(com.hubspot.singularity.SingularityTaskId) GeneratePresignedUrlRequest(com.amazonaws.services.s3.model.GeneratePresignedUrlRequest) Schema(io.swagger.v3.oas.annotations.media.Schema) Longs(com.google.common.primitives.Longs) S3ObjectSummaryHolder(com.hubspot.singularity.helpers.S3ObjectSummaryHolder) ImmutableMap(com.google.common.collect.ImmutableMap) ContinuationToken(com.hubspot.singularity.api.ContinuationToken) Collection(java.util.Collection) ConcurrentHashMap(java.util.concurrent.ConcurrentHashMap) Singularity(com.hubspot.singularity.Singularity) Set(java.util.Set) S3Configuration(com.hubspot.singularity.config.S3Configuration) SingularityS3LogMetadata(com.hubspot.singularity.SingularityS3LogMetadata) Executors(java.util.concurrent.Executors) Parameter(io.swagger.v3.oas.annotations.Parameter) JavaUtils(com.hubspot.mesos.JavaUtils) List(java.util.List) SingularityAuthorizationScope(com.hubspot.singularity.SingularityAuthorizationScope) Tag(io.swagger.v3.oas.annotations.tags.Tag) Optional(java.util.Optional) SingularityS3FormatHelper(com.hubspot.singularity.SingularityS3FormatHelper) SimplifiedTaskState(com.hubspot.singularity.SingularityTaskHistoryUpdate.SimplifiedTaskState) SingularityS3Log(com.hubspot.singularity.SingularityS3Log) ListeningExecutorService(com.google.common.util.concurrent.ListeningExecutorService) ThreadFactoryBuilder(com.google.common.util.concurrent.ThreadFactoryBuilder) SingularityRequestWithState(com.hubspot.singularity.SingularityRequestWithState) SingularityRequest(com.hubspot.singularity.SingularityRequest) SingularityTaskHistoryUpdate(com.hubspot.singularity.SingularityTaskHistoryUpdate) Iterables(com.google.common.collect.Iterables) MoreExecutors(com.google.common.util.concurrent.MoreExecutors) PathParam(javax.ws.rs.PathParam) ListenableFuture(com.google.common.util.concurrent.ListenableFuture) SingularityRequestHistory(com.hubspot.singularity.SingularityRequestHistory) GET(javax.ws.rs.GET) SingularityUser(com.hubspot.singularity.SingularityUser) Auth(io.dropwizard.auth.Auth) HashMap(java.util.HashMap) Callable(java.util.concurrent.Callable) ListObjectsV2Result(com.amazonaws.services.s3.model.ListObjectsV2Result) ArrayList(java.util.ArrayList) HashSet(java.util.HashSet) Strings(com.google.common.base.Strings) SingularityS3UploaderFile(com.hubspot.singularity.SingularityS3UploaderFile) Content(io.swagger.v3.oas.annotations.media.Content) Operation(io.swagger.v3.oas.annotations.Operation) Lists(com.google.common.collect.Lists) ApiResponse(io.swagger.v3.oas.annotations.responses.ApiResponse) AsyncHttpClient(com.ning.http.client.AsyncHttpClient) AmazonS3(com.amazonaws.services.s3.AmazonS3) S3ObjectSummary(com.amazonaws.services.s3.model.S3ObjectSummary) SingularityAuthorizer(com.hubspot.singularity.auth.SingularityAuthorizer) SingularityDeployHistory(com.hubspot.singularity.SingularityDeployHistory) SingularityTaskHistory(com.hubspot.singularity.SingularityTaskHistory) POST(javax.ws.rs.POST) Logger(org.slf4j.Logger) SingularityS3Services(com.hubspot.singularity.helpers.SingularityS3Services) ObjectMapper(com.fasterxml.jackson.databind.ObjectMapper) ResponseHeaderOverrides(com.amazonaws.services.s3.model.ResponseHeaderOverrides) WebExceptions.checkNotFound(com.hubspot.singularity.WebExceptions.checkNotFound) ExecutionException(java.util.concurrent.ExecutionException) TimeUnit(java.util.concurrent.TimeUnit) Futures(com.google.common.util.concurrent.Futures) ArraySchema(io.swagger.v3.oas.annotations.media.ArraySchema) RequestHistoryHelper(com.hubspot.singularity.data.history.RequestHistoryHelper) GetObjectMetadataRequest(com.amazonaws.services.s3.model.GetObjectMetadataRequest) SingularityS3Service(com.hubspot.singularity.helpers.SingularityS3Service) Comparator(java.util.Comparator) Collections(java.util.Collections) AmazonS3(com.amazonaws.services.s3.AmazonS3) Set(java.util.Set) HashSet(java.util.HashSet) ContinuationToken(com.hubspot.singularity.api.ContinuationToken) ListObjectsV2Result(com.amazonaws.services.s3.model.ListObjectsV2Result) ArrayList(java.util.ArrayList) Callable(java.util.concurrent.Callable) S3ObjectSummaryHolder(com.hubspot.singularity.helpers.S3ObjectSummaryHolder) GetObjectMetadataRequest(com.amazonaws.services.s3.model.GetObjectMetadataRequest) ListObjectsV2Request(com.amazonaws.services.s3.model.ListObjectsV2Request) List(java.util.List) ArrayList(java.util.ArrayList) SingularityS3Service(com.hubspot.singularity.helpers.SingularityS3Service) SingularityS3LogMetadata(com.hubspot.singularity.SingularityS3LogMetadata) S3ObjectSummary(com.amazonaws.services.s3.model.S3ObjectSummary) Date(java.util.Date) GeneratePresignedUrlRequest(com.amazonaws.services.s3.model.GeneratePresignedUrlRequest) SingularityS3Log(com.hubspot.singularity.SingularityS3Log) AtomicInteger(java.util.concurrent.atomic.AtomicInteger) ListenableFuture(com.google.common.util.concurrent.ListenableFuture) ResponseHeaderOverrides(com.amazonaws.services.s3.model.ResponseHeaderOverrides) Map(java.util.Map) ImmutableMap(com.google.common.collect.ImmutableMap) ConcurrentHashMap(java.util.concurrent.ConcurrentHashMap) HashMap(java.util.HashMap)

Example 2 with SingularityS3SearchRequest

use of com.hubspot.singularity.api.SingularityS3SearchRequest in project Singularity by HubSpot.

the class S3LogResource method getS3LogsForTask.

@GET
@Path("/task/{taskId}")
@Operation(summary = "Retrieve the list of logs stored in S3 for a specific task", responses = { @ApiResponse(responseCode = "200", description = "Returns a list of metadata about log files for the specified task", content = { @Content(array = @ArraySchema(schema = @Schema(implementation = SingularityS3LogMetadata.class))), @Content(array = @ArraySchema(schema = @Schema(implementation = SingularityS3Log.class))) }), @ApiResponse(responseCode = "404", description = "S3 configuration is not present") })
public List<SingularityS3LogMetadata> getS3LogsForTask(@Parameter(hidden = true) @Auth SingularityUser user, @Parameter(required = true, description = "The task ID to search for") @PathParam("taskId") String taskId, @Parameter(description = "Start timestamp (millis, 13 digit)") @QueryParam("start") Optional<Long> start, @Parameter(description = "End timestamp (mills, 13 digit)") @QueryParam("end") Optional<Long> end, @Parameter(description = "Exclude custom object metadata") @QueryParam("excludeMetadata") @DefaultValue("false") boolean excludeMetadata, @Parameter(description = "Do not generate download/get urls, only list the files and metadata") @QueryParam("list") @DefaultValue("false") boolean listOnly) throws Exception {
    checkS3();
    final SingularityS3SearchRequest search = new SingularityS3SearchRequest(Collections.emptyMap(), Collections.singletonList(taskId), start, end, excludeMetadata, listOnly, Optional.empty(), Collections.emptyMap());
    try {
        return getS3Logs(configuration.get(), getServiceToPrefixes(search, user), search, false).getResults();
    } catch (TimeoutException te) {
        throw timeout("Timed out waiting for response from S3 for %s", taskId);
    } catch (Throwable t) {
        throw new RuntimeException(t);
    }
}
Also used : SingularityS3SearchRequest(com.hubspot.singularity.api.SingularityS3SearchRequest) TimeoutException(java.util.concurrent.TimeoutException) Path(javax.ws.rs.Path) GET(javax.ws.rs.GET) Operation(io.swagger.v3.oas.annotations.Operation)

Aggregations

HttpMethod (com.amazonaws.HttpMethod)1 AmazonS3 (com.amazonaws.services.s3.AmazonS3)1 GeneratePresignedUrlRequest (com.amazonaws.services.s3.model.GeneratePresignedUrlRequest)1 GetObjectMetadataRequest (com.amazonaws.services.s3.model.GetObjectMetadataRequest)1 ListObjectsV2Request (com.amazonaws.services.s3.model.ListObjectsV2Request)1 ListObjectsV2Result (com.amazonaws.services.s3.model.ListObjectsV2Result)1 ResponseHeaderOverrides (com.amazonaws.services.s3.model.ResponseHeaderOverrides)1 S3ObjectSummary (com.amazonaws.services.s3.model.S3ObjectSummary)1 ObjectMapper (com.fasterxml.jackson.databind.ObjectMapper)1 Strings (com.google.common.base.Strings)1 ImmutableMap (com.google.common.collect.ImmutableMap)1 Iterables (com.google.common.collect.Iterables)1 Lists (com.google.common.collect.Lists)1 Longs (com.google.common.primitives.Longs)1 Futures (com.google.common.util.concurrent.Futures)1 ListenableFuture (com.google.common.util.concurrent.ListenableFuture)1 ListeningExecutorService (com.google.common.util.concurrent.ListeningExecutorService)1 MoreExecutors (com.google.common.util.concurrent.MoreExecutors)1 ThreadFactoryBuilder (com.google.common.util.concurrent.ThreadFactoryBuilder)1 Inject (com.google.inject.Inject)1