BufferedFileIO.java

/*
 * #%L
 * nom.tam FITS library
 * %%
 * Copyright (C) 2004 - 2021 nom-tam-fits
 * %%
 * This is free and unencumbered software released into the public domain.
 * 
 * Anyone is free to copy, modify, publish, use, compile, sell, or
 * distribute this software, either in source code form or as a compiled
 * binary, for any purpose, commercial or non-commercial, and by any
 * means.
 * 
 * In jurisdictions that recognize copyright laws, the author or authors
 * of this software dedicate any and all copyright interest in the
 * software to the public domain. We make this dedication for the benefit
 * of the public at large and to the detriment of our heirs and
 * successors. We intend this dedication to be an overt act of
 * relinquishment in perpetuity of all present and future rights to this
 * software under copyright law.
 * 
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
 * IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 * #L%
 */

package nom.tam.util;

import java.io.Closeable;
import java.io.EOFException;
import java.io.File;
import java.io.FileDescriptor;
import java.io.Flushable;
import java.io.IOException;
import java.io.RandomAccessFile;
import java.nio.channels.FileChannel;

/**
 * Basic file input/output with efficient internal buffering. 
 * 
 * @author Attila Kovacs
 *
 * @since 1.16
 */
class BufferedFileIO implements InputReader, OutputWriter, Flushable, Closeable {
    
    protected static final int BYTE_MASK = 0xFF;
    
    /** The undelying unbuffere random access file IO */
    private RandomAccessFile file;
    
    /** The file position at which the buffer begins */
    private long startOfBuf;
    
    /** The buffer */
    private byte[] buf;
    
    /** Pointer to the next byte to read/write */
    private int offset;
    
    /** The last legal element in the buffer */
    private int end;
    
    /** Whether the buffer has been modified locally, so it needs to be written back to stream before discarding. */
    private boolean isModified;
    
    /** Whether the current position is beyond the current ennd-of-file */
    private boolean writeAhead;
    
    
    /**
     * Instantiates a new buffered random access file with the specified IO mode and buffer size.
     * This class offers up to 2+ orders of magnitude superior performance over {@link RandomAccessFile}
     * when repeatedly reading or writing chunks of data at consecutive locations
     * 
     * @param f             the file
     * @param mode          the access mode, such as "rw" (see {@link RandomAccessFile} for more info).
     * @param bufferSize    the size of the buffer in bytes
     * @throws IOException  if there was an IO error getting the required access to the file.
     */
    BufferedFileIO(File f, String mode, int bufferSize) throws IOException {
        this.file = new RandomAccessFile(f, mode);
        buf = new byte[bufferSize];
        startOfBuf = 0;
        offset = 0;
        end = 0;
        isModified = false;
        writeAhead = false;
    }
    
    public final synchronized void seek(long newPos) throws IOException {
        // Check that the new position is valid
        if (newPos < 0) {                
            throw new IllegalArgumentException("seek at " + newPos);
        }
        
        if (newPos <= startOfBuf + end) {
            // AK: Do not invoke checking length (costly) if not necessary
            writeAhead = false;
        } else {
            writeAhead = newPos > length();
        }
        
        if (newPos < startOfBuf || newPos >= startOfBuf + end) {
            // The new position is outside the currently buffered region.
            // Write the current buffer back to the stream, and start anew.
            flush();
  
            // We'll start buffering at the new position next.
            startOfBuf = newPos;
            end = 0;
        }
        
        // Position within the new buffer...
        offset = (int) (newPos - startOfBuf);
        
        matchBufferPos();
    }
    
    /**
     * Get the channel associated with this file. Note that this returns the
     * channel of the associated RandomAccessFile. Note that since the
     * BufferedFile buffers the I/O's to the underlying file, the offset of the
     * channel may be different than the offset of the BufferedFile. This is
     * different than for a RandomAccessFile where the offsets are guaranteed to
     * be the same.
     * 
     * @return the file channel
     */
    public final FileChannel getChannel() {
        return file.getChannel();
    }
    
    /**
     * Get the file descriptor associated with this stream. Note that this
     * returns the file descriptor of the associated RandomAccessFile.
     * 
     * @return the file descriptor
     * @throws IOException
     *             if the descriptor could not be accessed.
     */
    public final FileDescriptor getFD() throws IOException {
        return file.getFD();
    }

    /**
     * Gets the current read/write position in the file.
     * 
     * @return the current byte offset from the beginning of the file.
     */
    public final synchronized long getFilePointer() {
        return startOfBuf + offset;
    }
    
    /**
     * Returns the number of bytes that can still be read from the file before the end
     * is reached.
     * 
     * @return                  the number of bytes left to read.
     * @throws IOException      if there was an IO error.
     */
    private synchronized long getRemaining() throws IOException {
        long n = file.length() - getFilePointer();
        return n > 0 ? n : 0L;
    }
    
    /**
     * Checks if there is more that can be read from this file. If so, it ensures that
     * the next byte is buffered.
     * 
     * @return      <code>true</code> if there is more that can be read from the file
     *              (and from the buffer!), or else <code>false</code>.
     *              
     * @throws IOException  if there was an IO error accessing the file.
     */
    private synchronized boolean makeAvailable() throws IOException {
        if (offset < end) {
            return true;
        }
        
        if (getRemaining() <= 0) {
            return false;
        }

        // Buffer as much as we can.
        seek(getFilePointer());
        end = file.read(buf, 0, buf.length);
        
        return end > 0;
    }
    
    /**
     * Checks if there are the required number of bytes available to read from this file.
     * 
     * @param need  the number of bytes we need.
     * @return      <code>true</code> if the needed number of bytes can be read from the file
     *              or else <code>false</code>.
     *              
     * @throws IOException  if there was an IO error accessing the file.
     */
    public final synchronized boolean hasAvailable(int need) throws IOException {
        if (end >= offset + need) {
            return true;
        }
        if (file.length() >= getFilePointer() + need) {
            return true;
        }
        return false;
    }
    
    /**
     * Returns the current length of the file.
     * 
     * @return the current length of the file.
     * @throws IOException
     *             if the operation failed
     */
    public final synchronized long length() throws IOException {
        // It's either the file's length or that of the end of the (yet) unsynched buffer...
        if (end > 0) {
            return Math.max(file.length(), startOfBuf + end);
        }
        return file.length();
    }
    
    /**
     * Sets the length of the file. This method calls the method of the same name
     * in {@link RandomAccessFile}.
     * 
     * @param newLength
     *            The number of bytes at which the file is set.
     * @throws IOException
     *             if the resizing of the underlying stream fails
     */
    public synchronized void setLength(long newLength) throws IOException {
        // Check if we can change the length inside the current buffer.
        final long bufEnd = startOfBuf + end;
        if (newLength >= startOfBuf && newLength < bufEnd) {
            // If truncated in the buffered region, then truncate the buffer also...
            end = (int) (newLength - startOfBuf);
        } else {
            flush();
            end = 0;
        }
        
        if (getFilePointer() > newLength) {
            seek(newLength);
        }
        
        // Change the length of the file itself...
        file.setLength(newLength);
    }
    
    /** 
     * Positions the file pointer to match the current buffer pointer.
     * 
     * @throws IOException  if there was an IO error
     */
    private synchronized void matchBufferPos() throws IOException {
        file.seek(getFilePointer());
    }
    
  
    /** 
     * Positions the buffer pointer to match the current file pointer.
     * 
     * @throws IOException  if there was an IO error
     */
    private synchronized void matchFilePos() throws IOException {
        seek(file.getFilePointer());
    }
    
    @Override
    public synchronized void close() throws IOException {
        flush();
        file.close();
        startOfBuf = 0;
        offset = 0;
        end = 0;
    }
    
    /**
     * Moves the buffer to the current read/write position.
     * 
     * @throws IOException  if there was an IO error writing the prior data back to the file.
     */
    private synchronized void moveBuffer() throws IOException {
        seek(getFilePointer());
    }
    
    @Override
    public synchronized void flush() throws IOException {
        if (!isModified) {
            return;
        }

        // the buffer was modified locally, so we need to write it back to the stream    
        if (end > 0) {
            file.seek(startOfBuf);
            file.write(buf, 0, end);
        }
        isModified = false;
    }
    
   
    @Override
    public final synchronized void write(int b) throws IOException {
        if (writeAhead) {
            setLength(getFilePointer());
        }

        if (offset >= buf.length) {
            // The buffer is full, it's time to write it back to stream, and start anew
            moveBuffer();
        }
        
        isModified = true;
        buf[offset++] = (byte) b;
       
        if (offset > end) {
            // We are writing at the end of the file, and we need to grow the buffer with the file...
            end = offset;
        }
    }
    
    
    @Override
    public final synchronized int read() throws IOException {
        if (!makeAvailable()) {
            // By contract of read(), it returns -1 at th end of file.
            return -1;
        }

        // Return the unsigned(!) byte.
        return buf[offset++] & BYTE_MASK;
    }
    
    
    @Override
    public final synchronized void write(byte[] b, int from, int len) throws IOException {
        if (len <= 0) {
            return;
        }

        if (writeAhead) {
            setLength(getFilePointer());
        }
        
        if (len > 2 * buf.length) {
            // Large direct write...
            matchBufferPos();
            file.write(b, from, len);
            matchFilePos();
            return;
        }
        
        while (len > 0) {
            if (offset >= buf.length) {
                // The buffer is full, it's time to write it back to stream, and start anew.
                moveBuffer();
            }
            
            isModified = true;
            int n = Math.min(len, buf.length - offset);
            System.arraycopy(b, from, buf, offset, n);
            
            offset += n;
            from += n;
            len -= n;
           
            if (offset > end) {
                // We are growing the file, so grow the buffer also...
                end = offset;
            }
        }
    }
    
    @Override
    public final synchronized int read(byte[] b, int from, int len) throws IOException {
        if (len <= 0) {
            // Nothing to do.
            return 0;
        }
        
        if (len > 2 * buf.length) {
            // Large direct read...
            matchBufferPos();
            int l = file.read(b, from, len);
            matchFilePos();
            return l;
        }
        
        int got = 0;
        
        while (got < len) {
            if (!makeAvailable()) {
                return got > 0 ? got : -1;
            }
            
            int n = Math.min(len - got, end - offset);   
            
            System.arraycopy(buf, offset, b, from, n);
            
            got += n;
            offset += n;   
            from += n;
        }

        return got;
    }
    
    /**
     * Reads bytes to completely fill the supplied buffer. If not enough bytes are avaialable in the
     * file to fully fill the buffer, an {@link EOFException} will be thrown.
     * 
     * @param b             the buffer
     * @throws IOException  if there was an IO error before the buffer could be fully populated.
     * 
     */
    public final synchronized void readFully(byte[] b) throws IOException {
        readFully(b, 0, b.length);
    }

    /**
     * Reads bytes to fill the supplied buffer with the requested number of bytes from the given
     * starting buffer index. If not enough bytes are avaialable in the
     * file to deliver the reqauested number of bytes the buffer, an {@link EOFException} will be thrown.
     * 
     * @param b             the buffer
     * @param off           the buffer index at which to start reading data
     * @param len           the total number of bytes to read.
     * @throws IOException  if there was an IO error before the requested number of bytes could
     *                      all be read.
     */
    public synchronized void readFully(byte[] b, int off, int len) throws IOException { 
        while (len > 0) {
            int n = read(b, off, len);
            if (n < 0) {
                throw new EOFException();
            }
            off += n;
            len -= n;
        }
    }
    
    /**
     * Same as {@link RandomAccessFile#readUTF()}.
     * 
     * @return              a string
     * @throws IOException  if there was an IO error while reading from the file.
     */
    public final synchronized String readUTF() throws IOException {
        matchBufferPos();
        String s = file.readUTF();
        matchFilePos();
        return s;
    }

    /**
     * Same as {@link RandomAccessFile#writeUTF(String)}
     * 
     * @param s             a string
     * @throws IOException  if there was an IO error while writing to the file.
     */
    public final synchronized void writeUTF(String s) throws IOException {
        matchBufferPos();
        file.writeUTF(s);
        matchFilePos();
    }
    
    /**
     * Moves the file pointer by a number of bytes from its current position.
     * 
     * @param n     the number of byter to move. Negative values are allowed and
     *              result in moving the pointer backward.
     * @return      the actual number of bytes that the pointer moved, which may be
     *              fewer than requested if the file boundary was reached.
     * @throws IOException  if there was an IO error.
     */
    public final synchronized long skip(long n) throws IOException {
        if (offset + n >= 0 && offset + n <= end) {
            // Skip within the buffered region...
            offset = (int) (offset + n);
            return n;
        }
        
        long pos = getFilePointer();
       
        n = Math.max(n, -pos);        
        
        seek(pos + n);
        return n;
    }

    /**
     * Read as many bytes into a byte array as possible. The number of bytes read may be fewer than
     * the size of the array, for example because the end-of-file is reached during the read.
     * 
     * @param b         the byte buffer to fill with data from the file.
     * @return          the number of bytes actually read.
     * @throws IOException  if there was an IO error while reading, other than the end-of-file.
     * 
     */
    public final synchronized int read(byte[] b) throws IOException {
        return read(b, 0, b.length);
    }
    
    /**
     * Writes the contents of a byte array into the file.
     * 
     * @param b             the byte buffer to write into the file.
     * @throws IOException  if there was an IO error while writing to the file...
     * 
     */
    public final synchronized void write(byte[] b) throws IOException {
        write(b, 0, b.length);
    }
    
}