
[ALS-4461] Allow incremental vcf loading #73

Merged 40 commits on Aug 23, 2023
6287251
ALS-4461: Deserialize variant index from disk
ramari16 May 25, 2023
3537737
ALS-4461: Add variant index builder for VCF loading
ramari16 May 25, 2023
620a5af
ALS-4461: Upgrade major version
ramari16 May 31, 2023
c0ad4a4
ALS-4461: Upgrade major version
ramari16 May 31, 2023
5afa1fe
ALS-4461: Store variants by index instead of full variant spec. Refac…
ramari16 Jun 15, 2023
dbf3a2f
ALS-4461: Initial commit for genomic dataset merger
ramari16 Jun 15, 2023
01efbf0
ALS-4461: Add jar with dependencies build instructions
ramari16 Jun 16, 2023
68e849e
ALS-4461: Fix issue with hardcoded directory
ramari16 Jun 20, 2023
a141f92
ALS-4461: Fix more issues with non-relative file paths, various refac…
ramari16 Jun 21, 2023
160bc87
ALS-4461: Fix more issues with non-relative file paths, various refac…
ramari16 Jun 21, 2023
ee6ee2f
ALS-4461: Parallelize chromosome mask merging
ramari16 Jun 21, 2023
df366d0
ALS-4461: Updated hpds version in dockerfile
ramari16 Jun 22, 2023
5e3a93e
ALS-4461: Update genomic directory on loading for variant index stores
ramari16 Jun 26, 2023
7433fde
ALS-4461: Change type of variant index store from String (variant spe…
ramari16 Jun 29, 2023
f508062
ALS-4461: Refactor duplicated variant store read/write code
ramari16 Jul 5, 2023
8da85d0
ALS-4461: Refactor duplicated variant store read/write code
ramari16 Jul 5, 2023
295f52e
ALS-4461: Fixing thread issues at startup
ramari16 Jul 7, 2023
36904a8
ALS-4461: Fixing thread issues at startup
ramari16 Jul 7, 2023
9e22c10
Testing GET/POST bug
ramari16 Jul 24, 2023
747b0a1
Revert
ramari16 Jul 26, 2023
c7afde5
Revert
ramari16 Jul 26, 2023
5e56f09
ALS-4461: Fix error handling
ramari16 Aug 8, 2023
a2749e7
Merge master into ALS-4461
ramari16 Aug 8, 2023
7de09ff
ALS-4461: Rollback testing change
ramari16 Aug 9, 2023
15fe3bf
ALS-4461: Clean up error handling in file backed storages
ramari16 Aug 9, 2023
52cc4a0
ALS-4461: Clean up error handling in file backed storages
ramari16 Aug 9, 2023
88ea1c2
ALS-4461: Remove IOExceptions thrown from FBBIS
ramari16 Aug 9, 2023
df03002
ALS-4461: Remove IOExceptions thrown from FBBIS
ramari16 Aug 9, 2023
b0d13ea
ALS-4461: Fix deserialization issue
ramari16 Aug 9, 2023
28b2672
ALS-4461: Add comment explaining chromosome index merging
ramari16 Aug 10, 2023
9bc9e21
ALS-4461: Add comments
ramari16 Aug 10, 2023
b22cc1b
ALS-4461: Changes per PR
ramari16 Aug 11, 2023
15c9f00
ALS-4461: Refactor variant spec index to make testing easier
ramari16 Aug 17, 2023
0a5fde5
ALS-4461: Refactor genomic dataset merger to support testing
ramari16 Aug 17, 2023
abb2659
ALS-4461: Add validation to prevent patient id duplicates
ramari16 Aug 21, 2023
93c5a17
ALS-4461: Fix GenomicDatasetMerger name in jar with dependencies config
ramari16 Aug 21, 2023
3bb4fe0
ALS-4461: Add main args validation
ramari16 Aug 21, 2023
c2a0f38
ALS-4461: Remove unused method
ramari16 Aug 21, 2023
ed9a5d4
ALS-4461: Remove unused classes
ramari16 Aug 23, 2023
f6ea975
ALS-4461: Remove potential race condition
ramari16 Aug 23, 2023
4 changes: 2 additions & 2 deletions client-api/pom.xml
@@ -4,12 +4,12 @@
<parent>
<artifactId>pic-sure-hpds</artifactId>
<groupId>edu.harvard.hms.dbmi.avillach.hpds</groupId>
-		<version>1.0-SNAPSHOT</version>
+		<version>2.0.0-SNAPSHOT</version>
</parent>

<groupId>edu.harvard.hms.dbmi.avillach.hpds</groupId>
<artifactId>client-api</artifactId>
-	<version>1.0-SNAPSHOT</version>
+	<version>2.0.0-SNAPSHOT</version>

<name>client-api</name>
<!-- FIXME change it to the project's website -->
10 changes: 9 additions & 1 deletion common/pom.xml
@@ -6,7 +6,7 @@
<parent>
<artifactId>pic-sure-hpds</artifactId>
<groupId>edu.harvard.hms.dbmi.avillach.hpds</groupId>
-		<version>1.0-SNAPSHOT</version>
+		<version>2.0.0-SNAPSHOT</version>
</parent>

<artifactId>common</artifactId>
@@ -21,5 +21,13 @@
<groupId>com.google.guava</groupId>
<artifactId>guava</artifactId>
</dependency>
+		<dependency>
+			<groupId>org.codehaus.jackson</groupId>
+			<artifactId>jackson-core-asl</artifactId>
+		</dependency>
+		<dependency>
+			<groupId>org.codehaus.jackson</groupId>
+			<artifactId>jackson-mapper-asl</artifactId>
+		</dependency>
</dependencies>
</project>
@@ -1,44 +1,52 @@
package edu.harvard.hms.dbmi.avillach.hpds.storage;

import java.io.ByteArrayInputStream;
import java.io.File;
import java.io.FileNotFoundException;
import java.io.IOException;
import java.io.ObjectInputStream;
import java.io.ObjectOutputStream;
import java.io.RandomAccessFile;
import java.io.Serializable;
import java.io.*;
import java.util.Set;
import java.util.concurrent.ConcurrentHashMap;
import java.util.function.Function;
import java.util.zip.GZIPInputStream;
import java.util.zip.GZIPOutputStream;

import org.apache.commons.io.output.ByteArrayOutputStream;

-public class FileBackedByteIndexedStorage <K, V extends Serializable> implements Serializable {
+public abstract class FileBackedByteIndexedStorage <K, V extends Serializable> implements Serializable {
Review comment (Member):
It wouldn't be a ton of work to make this implement Map<K, V>; As is, you're approximating a lot of methods from that interface while missing small details that make this code hard to reuse. You could just crib from java's UnmodifiableMap
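The suggestion above can be sketched roughly as follows. `IndexedStore`, `store`, and the `HashMap` backing are hypothetical stand-ins for the file-backed index, not code from this PR; the point is that `AbstractMap` only requires `entrySet()`, and a read-only view can crib from `Collections.unmodifiableMap` as the reviewer notes.

```java
import java.util.AbstractMap;
import java.util.Collections;
import java.util.HashMap;
import java.util.Map;
import java.util.Set;

// Hypothetical sketch: expose an index-backed store through the Map interface
// by extending AbstractMap and overriding entrySet() plus the hot read path.
class IndexedStore<K, V> extends AbstractMap<K, V> {
    // Stands in for the ConcurrentHashMap<K, Long[]> index + RandomAccessFile pair.
    private final Map<K, V> backing = new HashMap<>();

    // Write path stays a named method so the Map view can remain unmodifiable.
    void store(K key, V value) {
        backing.put(key, value);
    }

    @Override
    public V get(Object key) {
        return backing.get(key); // direct lookup instead of AbstractMap's entrySet scan
    }

    @Override
    public Set<Map.Entry<K, V>> entrySet() {
        // Read-only view, cribbing from Collections.unmodifiableMap as suggested.
        return Collections.unmodifiableMap(backing).entrySet();
    }
}
```

Callers would then get `size()`, `containsKey()`, iteration, and so on for free from `AbstractMap`, which is the reuse the comment is after.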

private static final long serialVersionUID = -7297090745384302635L;
private transient RandomAccessFile storage;
private ConcurrentHashMap<K, Long[]> index;
private File storageFile;
private boolean completed = false;
private Long maxStorageSize; //leave this in to not break serialization
protected transient RandomAccessFile storage;
protected ConcurrentHashMap<K, Long[]> index;
protected File storageFile;
protected boolean completed = false;


public FileBackedByteIndexedStorage(Class<K> keyClass, Class<V> valueClass, File storageFile) throws FileNotFoundException {
this.index = new ConcurrentHashMap<K, Long[]>();
this.storageFile = storageFile;
this.storage = new RandomAccessFile(this.storageFile, "rw");
}

public void updateStorageDirectory(File storageDirectory) {
if (!storageDirectory.isDirectory()) {
throw new IllegalArgumentException("storageDirectory is not a directory");
}
String currentStoreageFilename = storageFile.getName();
storageFile = new File(storageDirectory, currentStoreageFilename);
}

public Set<K> keys(){
return index.keySet();
}

-	public void put(K key, V value) throws IOException {
+	public void put(K key, V value) {
if(completed) {
throw new RuntimeException("A completed FileBackedByteIndexedStorage cannot be modified.");
}
-		Long[] recordIndex = store(value);
+		Long[] recordIndex;
try (ByteArrayOutputStream out = writeObject(value)) {
recordIndex = new Long[2];
synchronized (storage) {
Review comment (Member):

You can get some really difficult to debug concurrency problems here if a thread calls updateStorageDirectory while you're inside this synchronized block

Review comment (Member):
Really, shouldn't the storage file name be immutable within the lifetime of this object? That would address my locking concerns.

Reply (Contributor, author):
I agree. This code was just moved from somewhere else. I did not introduce it and am very hesitant to actually change it. I will think about this

Reply (Contributor, author):
I did misunderstand your second comment originally -- the reason updateStorageDirectory exists is that requiring the directory where this is built during the ETL process to match the directory where the data is stored in HPDS was really annoying.

The creating, saving, loading, and actual usage of this class by HPDS is somewhat jumbled and unsafe right now, I agree.
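The reviewer's immutability suggestion could look roughly like the sketch below; the class and method names are hypothetical, not from this PR. Resolving the path once in the constructor makes the file name fixed for the object's lifetime, so `updateStorageDirectory()` and its interaction with the `synchronized (storage)` block disappear.

```java
import java.io.File;

// Hypothetical sketch: resolve the storage path once, at construction,
// so the file name is immutable and no mutator can race the storage lock.
class ImmutableStorageConfig {
    private final File storageFile; // never reassigned after construction

    ImmutableStorageConfig(File storageDirectory, String fileName) {
        if (!storageDirectory.isDirectory()) {
            throw new IllegalArgumentException("storageDirectory is not a directory");
        }
        this.storageFile = new File(storageDirectory, fileName);
    }

    File storageFile() {
        return storageFile;
    }
}
```

The ETL-vs-runtime directory mismatch the author describes would then be handled by passing the right directory at load time rather than mutating the object afterward.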

storage.seek(storage.length());
recordIndex[0] = storage.getFilePointer();
storage.write(out.toByteArray());
recordIndex[1] = storage.getFilePointer() - recordIndex[0];
}
} catch (IOException e) {
throw new UncheckedIOException(e);
}
index.put(key, recordIndex);
}

@@ -63,60 +71,43 @@ public void complete() {
this.completed = true;
}

public boolean isComplete() {
return this.completed;
}

private Long[] store(V value) throws IOException {

ByteArrayOutputStream out = new ByteArrayOutputStream();
ObjectOutputStream oos = new ObjectOutputStream(new GZIPOutputStream(out));
oos.writeObject(value);
oos.flush();
oos.close();

Long[] recordIndex = new Long[2];
synchronized(storage) {
storage.seek(storage.length());
recordIndex[0] = storage.getFilePointer();
storage.write(out.toByteArray());
recordIndex[1] = storage.getFilePointer() - recordIndex[0];
// maxStorageSize = storage.getFilePointer();
}
return recordIndex;
}

public V get(K key) throws IOException {
if(this.storage==null) {
synchronized(this) {
this.open();
}
}
Long[] offsetsInStorage = index.get(key);
if(offsetsInStorage != null) {
Long offsetInStorage = index.get(key)[0];
int offsetLength = index.get(key)[1].intValue();
if(offsetInStorage != null && offsetLength>0) {
byte[] buffer = new byte[offsetLength];
synchronized(storage) {
storage.seek(offsetInStorage);
storage.readFully(buffer);
public V get(K key) {
try {
if(this.storage==null) {
synchronized(this) {
this.open();
Review comment (Member):
I know you didn't write this, but I'm also worried that this is not as safe as it seems.

  1. Thread A evaluates this.storage==null as true
  2. Thread B evaluates this.storage==null as true
  3. Thread A enters the synchronized block
  4. Thread B blocks due to the monitor
  5. Thread A continues, starts executing the rest of the get
  6. Thread B unblocks, opens the file again, changing the reference
  7. ???

99% sure the synchronized block has to include the null check

Reply (Contributor, author):
I agree with this. I made the change and added a todo comment to make this class immutable and remove the need for this check
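The fix the thread converges on can be sketched like this. The file handle is replaced by a plain `Object` plus an `open()` counter so the sketch is self-contained; this is not the actual HPDS class. The essential change is that the null check sits inside the monitor, so the check-then-open sequence is atomic.

```java
import java.util.concurrent.atomic.AtomicInteger;

// Hypothetical sketch of safe lazy initialization: two threads calling
// getStorage() concurrently can no longer both see null and both call open().
class LazyResource {
    static final AtomicInteger opens = new AtomicInteger(); // counts open() calls

    private Object storage; // guarded by "this"

    private Object open() {
        opens.incrementAndGet();
        return new Object();
    }

    Object getStorage() {
        synchronized (this) { // null check now inside the synchronized block
            if (storage == null) {
                storage = open();
            }
            return storage;
        }
    }
}
```

An alternative is double-checked locking with a `volatile` field to skip the monitor on the fast path, but the plain synchronized form above is the simpler correct version of what the reviewer describes.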

}
ObjectInputStream in = new ObjectInputStream(new GZIPInputStream(new ByteArrayInputStream(buffer)));

try {
V readObject = (V) in.readObject();
}
Long[] offsetsInStorage = index.get(key);
if(offsetsInStorage != null) {
Long offsetInStorage = index.get(key)[0];
int offsetLength = index.get(key)[1].intValue();
Comment on lines +84 to +85
Review comment (Contributor):
Suggested change:
-			Long offsetInStorage = index.get(key)[0];
-			int offsetLength = index.get(key)[1].intValue();
+			Long offsetInStorage = offsetsInStorage[0];
+			int offsetLength = offsetsInStorage[1].intValue();

if(offsetInStorage != null && offsetLength>0) {
byte[] buffer = new byte[offsetLength];
synchronized(storage) {
storage.seek(offsetInStorage);
storage.readFully(buffer);
}
V readObject = readObject(buffer);
return readObject;
} catch (ClassNotFoundException e) {
throw new RuntimeException("This should never happen.");
} finally {
in.close();
}else {
return null;
}
}else {
} else {
return null;
}
} else {
return null;
} catch (IOException e) {
throw new UncheckedIOException(e);
}
}

protected abstract V readObject(byte[] buffer);

protected abstract ByteArrayOutputStream writeObject(V value) throws IOException;

public V getOrELse(K key, V defaultValue) {
V result = get(key);
return result == null ? defaultValue : result;
}

}
@@ -0,0 +1,32 @@
package edu.harvard.hms.dbmi.avillach.hpds.storage;

import java.io.*;
import java.util.zip.GZIPInputStream;
import java.util.zip.GZIPOutputStream;

public class FileBackedJavaIndexedStorage <K, V extends Serializable> extends FileBackedByteIndexedStorage<K, V> {
public FileBackedJavaIndexedStorage(Class<K> keyClass, Class<V> valueClass, File storageFile) throws FileNotFoundException {
super(keyClass, valueClass, storageFile);
}

protected ByteArrayOutputStream writeObject(V value) throws IOException {
ByteArrayOutputStream out = new ByteArrayOutputStream();
ObjectOutputStream oos = new ObjectOutputStream(new GZIPOutputStream(out));
oos.writeObject(value);
oos.flush();
oos.close();
return out;
}

@Override
protected V readObject(byte[] buffer) {
try (ObjectInputStream in = new ObjectInputStream(new GZIPInputStream(new ByteArrayInputStream(buffer)));) {
V readObject = (V) in.readObject();
return readObject;
} catch (IOException e) {
throw new UncheckedIOException(e);
} catch (ClassNotFoundException e) {
throw new RuntimeException(e);
}
}
}
@@ -0,0 +1,40 @@
package edu.harvard.hms.dbmi.avillach.hpds.storage;

import org.codehaus.jackson.map.ObjectMapper;
import org.codehaus.jackson.type.TypeReference;

import java.io.*;
import java.util.zip.GZIPInputStream;
import java.util.zip.GZIPOutputStream;

public abstract class FileBackedJsonIndexStorage <K, V extends Serializable> extends FileBackedByteIndexedStorage<K, V> {
Review comment (Member):
You're starting to create a pretty involved inheritance hierarchy. In my experience, these get difficult to read. We aren't in Java 17 yet, so you don't have sealed classes, which would help a lot. That said, you could approximate the concept of contained (bounded?) inheritance by putting your two implementing classes in this file.

Example: https://gist.github.com/Luke-Sikina/70d3fc83f34610623ea052d0ef04b5d8

Review comment (Member):
Oh I see. The implementing classes are in another package? Oof

Reply (ramari16, author, Aug 10, 2023):

My most recent changes to this have actually completely decoupled reading/writing from the rest of the logic in this class, so I think it would be pretty easy to get rid of the inheritance and introduce a dependency on an "objectMapper". Maybe...
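The author's composition idea could be sketched as an injected codec, so a single storage class serves both the Java-serialization and Jackson/JSON cases instead of one subclass per format. The names (`Codec`, `CodecDemo`, the `UTF8` codec) are hypothetical; a real version would pair an `ObjectOutputStream`-based codec with an `ObjectMapper`-based one.

```java
import java.nio.charset.StandardCharsets;

// Hypothetical sketch: the serialization strategy becomes a small injected
// interface rather than an abstract readObject/writeObject method pair.
interface Codec<V> {
    byte[] write(V value);

    V read(byte[] buffer);
}

class CodecDemo {
    // A trivial String codec standing in for ObjectOutputStream or ObjectMapper.
    static final Codec<String> UTF8 = new Codec<String>() {
        public byte[] write(String v) {
            return v.getBytes(StandardCharsets.UTF_8);
        }

        public String read(byte[] b) {
            return new String(b, StandardCharsets.UTF_8);
        }
    };
}
```

The storage class would then take a `Codec<V>` in its constructor, which also sidesteps the cross-package inheritance the reviewer objects to.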

private static final long serialVersionUID = -1086729119489479152L;

protected transient ObjectMapper objectMapper = new ObjectMapper();

public FileBackedJsonIndexStorage(File storageFile) throws FileNotFoundException {
super(null, null, storageFile);
}

protected ByteArrayOutputStream writeObject(V value) throws IOException {
ByteArrayOutputStream out = new ByteArrayOutputStream();
objectMapper.writeValue(new GZIPOutputStream(out), value);
return out;
}

protected V readObject(byte[] buffer) {
try {
return objectMapper.readValue(new GZIPInputStream(new ByteArrayInputStream(buffer)), getTypeReference());
} catch (IOException e) {
throw new RuntimeException(e);
}
}

// Required to populate the objectMapper on deserialization
private void readObject(ObjectInputStream in) throws IOException, ClassNotFoundException {
in.defaultReadObject();
objectMapper = new ObjectMapper();
}

public abstract TypeReference<V> getTypeReference();
}
2 changes: 1 addition & 1 deletion data/pom.xml
@@ -5,7 +5,7 @@
<parent>
<artifactId>pic-sure-hpds</artifactId>
<groupId>edu.harvard.hms.dbmi.avillach.hpds</groupId>
-		<version>1.0-SNAPSHOT</version>
+		<version>2.0.0-SNAPSHOT</version>
</parent>

<artifactId>data</artifactId>