[ 
https://issues.apache.org/jira/browse/FLINK-7068?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=16173180#comment-16173180
 ] 

ASF GitHub Bot commented on FLINK-7068:
---------------------------------------

Github user NicoK commented on a diff in the pull request:

    https://github.com/apache/flink/pull/4358#discussion_r139969639
  
    --- Diff: 
flink-runtime/src/main/java/org/apache/flink/runtime/blob/TransientBlobCache.java
 ---
    @@ -0,0 +1,322 @@
    +/*
    + * Licensed to the Apache Software Foundation (ASF) under one
    + * or more contributor license agreements.  See the NOTICE file
    + * distributed with this work for additional information
    + * regarding copyright ownership.  The ASF licenses this file
    + * to you under the Apache License, Version 2.0 (the
    + * "License"); you may not use this file except in compliance
    + * with the License.  You may obtain a copy of the License at
    + *
    + *     http://www.apache.org/licenses/LICENSE-2.0
    + *
    + * Unless required by applicable law or agreed to in writing, software
    + * distributed under the License is distributed on an "AS IS" BASIS,
    + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
    + * See the License for the specific language governing permissions and
    + * limitations under the License.
    + */
    +
    +package org.apache.flink.runtime.blob;
    +
    +import org.apache.flink.annotation.VisibleForTesting;
    +import org.apache.flink.api.common.JobID;
    +import org.apache.flink.configuration.BlobServerOptions;
    +import org.apache.flink.configuration.Configuration;
    +import org.apache.flink.util.FileUtils;
    +import org.slf4j.Logger;
    +import org.slf4j.LoggerFactory;
    +
    +import javax.annotation.Nullable;
    +import java.io.File;
    +import java.io.IOException;
    +import java.io.InputStream;
    +import java.net.InetSocketAddress;
    +import java.util.concurrent.atomic.AtomicBoolean;
    +import java.util.concurrent.atomic.AtomicLong;
    +import java.util.concurrent.locks.ReadWriteLock;
    +import java.util.concurrent.locks.ReentrantReadWriteLock;
    +
    +import static org.apache.flink.util.Preconditions.checkArgument;
    +import static org.apache.flink.util.Preconditions.checkNotNull;
    +
    +/**
    + * Provides access to transient BLOB files stored at the {@link 
BlobServer}.
    + *
    + * TODO: currently, this is still cache-based with local copies - make 
this truly transient, i.e. return file streams with no local copy
    + */
    +public class TransientBlobCache implements TransientBlobService {
    +
    +   /** The log object used for debugging. */
    +   private static final Logger LOG = 
LoggerFactory.getLogger(TransientBlobCache.class);
    +
    +   /** Counter to generate unique names for temporary files. */
    +   private final AtomicLong tempFileCounter = new AtomicLong(0);
    +
    +   private final InetSocketAddress serverAddress;
    +
    +   /**
    +    * Root directory for local file storage
    +    */
    +   private final File storageDir;
    +
    +   private final AtomicBoolean shutdownRequested = new AtomicBoolean();
    +
    +   /** Shutdown hook thread to ensure deletion of the local storage 
directory. */
    +   private final Thread shutdownHook;
    +
    +   /** The number of retries when the transfer fails */
    +   private final int numFetchRetries;
    +
    +   /** Configuration for the blob client like ssl parameters required to 
connect to the blob server */
    +   private final Configuration blobClientConfig;
    +
    +   /** Lock guarding concurrent file accesses */
    +   private final ReadWriteLock readWriteLock;
    +
    +   /**
    +    * Instantiates a new BLOB cache.
    +    *
    +    * @param serverAddress
    +    *              address of the {@link BlobServer} to use for fetching 
files from
    +    * @param blobClientConfig
    +    *              global configuration
    +    *
    +    * @throws IOException
    +    *              thrown if the (local or distributed) file storage 
cannot be created or is not usable
    +    */
    +   public TransientBlobCache(
    +                   final InetSocketAddress serverAddress,
    +                   final Configuration blobClientConfig) throws 
IOException {
    +
    +           this.serverAddress = checkNotNull(serverAddress);
    +           this.blobClientConfig = checkNotNull(blobClientConfig);
    +           this.readWriteLock = new ReentrantReadWriteLock();
    +
    +           // configure and create the storage directory
    +           String storageDirectory = 
blobClientConfig.getString(BlobServerOptions.STORAGE_DIRECTORY);
    +           this.storageDir = 
BlobUtils.initLocalStorageDirectory(storageDirectory);
    +           LOG.info("Created transient BLOB cache storage directory " + 
storageDir);
    +
    +           // configure the number of fetch retries
    +           final int fetchRetries = 
blobClientConfig.getInteger(BlobServerOptions.FETCH_RETRIES);
    +           if (fetchRetries >= 0) {
    +                   this.numFetchRetries = fetchRetries;
    +           } else {
    +                   LOG.warn("Invalid value for {}. System will attempt no 
retries on failed fetches of BLOBs.",
    +                           BlobServerOptions.FETCH_RETRIES.key());
    +                   this.numFetchRetries = 0;
    +           }
    +
    +           // Add shutdown hook to delete storage directory
    +           shutdownHook = BlobUtils.addShutdownHook(this, LOG);
    +   }
    +
    +   @Override
    +   public File getFile(BlobKey key) throws IOException {
    +           return getFileInternal(null, key);
    +   }
    +
    +   @Override
    +   public File getFile(JobID jobId, BlobKey key) throws IOException {
    +           checkNotNull(jobId);
    +           return getFileInternal(jobId, key);
    +   }
    +
    +   /**
    +    * Returns local copy of the file for the BLOB with the given key.
    +    * <p>
    +    * The method will first attempt to serve the BLOB from its local 
cache. If the BLOB is not in
    +    * the cache, the method will try to download it from this cache's BLOB 
server.
    +    *
    +    * @param jobId
    +    *              ID of the job this blob belongs to (or <tt>null</tt> if 
job-unrelated)
    +    * @param blobKey
    +    *              The key of the desired BLOB.
    +    *
    +    * @return file referring to the local storage location of the BLOB.
    +    *
    +    * @throws IOException
    +    *              Thrown if an I/O error occurs while downloading the 
BLOBs from the BLOB server.
    +    */
    +   private File getFileInternal(@Nullable JobID jobId, BlobKey blobKey) 
throws IOException {
    +           checkArgument(blobKey != null, "BLOB key cannot be null.");
    +
    +           final File localFile = BlobUtils.getStorageLocation(storageDir, 
jobId, blobKey);
    +           readWriteLock.readLock().lock();
    +
    +           try {
    +                   if (localFile.exists()) {
    +                           return localFile;
    +                   }
    +           } finally {
    +                   readWriteLock.readLock().unlock();
    +           }
    +
    +           // download from the BlobServer directly
    +           // use a temporary file (thread-safe without locking)
    +           File incomingFile = createTemporaryFilename();
    +           try {
    +                   BlobClient.downloadFromBlobServer(jobId, blobKey, 
false, incomingFile, serverAddress,
    +                           blobClientConfig, numFetchRetries);
    --- End diff --
    
    only manually via the `TransientBlobCache#delete()` methods


> change BlobService sub-classes for permanent and transient BLOBs
> ----------------------------------------------------------------
>
>                 Key: FLINK-7068
>                 URL: https://issues.apache.org/jira/browse/FLINK-7068
>             Project: Flink
>          Issue Type: Sub-task
>          Components: Distributed Coordination, Network
>    Affects Versions: 1.4.0
>            Reporter: Nico Kruber
>            Assignee: Nico Kruber
>
> A {{PermanentBlobStore}} should resemble use cases for BLOBs that are 
> permanently stored for a job's life time (HA and non-HA).
> A {{TransientBlobStore}} should reflect BLOB offloading for logs, RPC, etc. 
> which even does not have to be reflected by files.



--
This message was sent by Atlassian JIRA
(v6.4.14#64029)

Reply via email to