Commit db2a6ab

Merge pull request #16 from clowder-framework/release/1.10.0

v1.10.0 release

lmarini authored Jun 30, 2020
2 parents: 3b84e70 + 0792f2c
Showing 15 changed files with 463 additions and 89 deletions.
14 changes: 14 additions & 0 deletions CHANGELOG.md
@@ -4,7 +4,21 @@ All notable changes to this project will be documented in this file.
The format is based on [Keep a Changelog](http://keepachangelog.com/)
and this project adheres to [Semantic Versioning](http://semver.org/).

## 1.10.0 - 2020-06-30

### Added
- Ability to mark multiple files in a dataset and perform bulk operations (download, tag, delete) on them at once.

### Fixed
- Return thumbnail as part of the file information.
[#8](https://github.com/clowder-framework/clowder/issues/8)
- Dataset tiles on the space page would sometimes overlap.

### Changed
- The mongo-init script for creating users would exit with code -1 if the user already existed; it now exits with code 0.

## 1.9.0 - 2020-06-01

**_Warning:_ This update modifies information stored in Elasticsearch used for text based searching. To take advantage
of these changes a reindex of Elasticsearch is required. A reindex can be started by an admin from the Admin menu.**

83 changes: 78 additions & 5 deletions app/api/Datasets.scala
@@ -2065,10 +2065,16 @@ class Datasets @Inject()(
* @param dataset dataset from which to get the files
* @param chunkSize chunk size in memory in which to buffer the stream
* @param compression java built in compression value. Use 0 for no compression.
* @param bagit whether to include BagIt structures in the zip
* @param user an optional user to include in metadata
* @param fileIDs a list of UUIDs of files in the dataset to include (i.e. marked file downloads)
* @param folderId a folder UUID in the dataset to include (i.e. folder download)
* @return Enumerator to produce array of bytes from a zipped stream containing the bytes of each file
* in the dataset
*/
def enumeratorFromDataset(dataset: Dataset, chunkSize: Int = 1024 * 8, compression: Int = Deflater.DEFAULT_COMPRESSION, bagit: Boolean, user : Option[User])
def enumeratorFromDataset(dataset: Dataset, chunkSize: Int = 1024 * 8,
compression: Int = Deflater.DEFAULT_COMPRESSION, bagit: Boolean,
user : Option[User], fileIDs: Option[List[UUID]], folderId: Option[UUID])
(implicit ec: ExecutionContext): Enumerator[Array[Byte]] = {
implicit val pec = ec.prepare()
val dataFolder = if (bagit) "data/" else ""
@@ -2077,7 +2083,19 @@

// compute the list of all files and folders in the dataset. This will also make sure
// that all file and folder names are unique.
listFilesInFolder(dataset.files, dataset.folders, dataFolder, filenameMap, inputFiles)
fileIDs match {
case Some(fids) => {
Logger.info("Downloading only some files")
Logger.info(fids.toString)
listFilesInFolder(fids, List.empty, dataFolder, filenameMap, inputFiles)
}
case None => {
folderId match {
case Some(fid) => listFilesInFolder(List.empty, List(fid), dataFolder, filenameMap, inputFiles)
case None => listFilesInFolder(dataset.files, dataset.folders, dataFolder, filenameMap, inputFiles)
}
}
}

val md5Files = scala.collection.mutable.HashMap.empty[String, MessageDigest] //for the files
val md5Bag = scala.collection.mutable.HashMap.empty[String, MessageDigest] //for the bag files
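
A minimal, self-contained sketch of the selection logic introduced in the match above, with plain strings standing in for Clowder's `models.UUID` (names here are illustrative, not the project's API): `fileIDs` takes precedence over `folderId`, and both fall back to the whole dataset.

```scala
object SelectionSketch extends App {
  // Mirrors the precedence in enumeratorFromDataset: which file IDs and
  // folder IDs get fed to the zip walker.
  def select(fileIDs: Option[List[String]], folderId: Option[String],
             allFiles: List[String], allFolders: List[String]): (List[String], List[String]) =
    (fileIDs, folderId) match {
      case (Some(fids), _)   => (fids, Nil)            // marked-file (partial) download
      case (None, Some(fid)) => (Nil, List(fid))       // single-folder download
      case (None, None)      => (allFiles, allFolders) // full-dataset download
    }

  println(select(Some(List("f1")), None, List("f1", "f2"), List("d1"))) // (List(f1),List())
  println(select(None, Some("d1"), List("f1"), List("d1", "d2")))       // (List(),List(d1))
  println(select(None, None, List("f1"), List("d1")))                   // (List(f1),List(d1))
}
```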
@@ -2121,14 +2139,13 @@
* the enumerator is finished
*/

var is: Option[InputStream] = addDatasetInfoToZip(dataFolder,dataset,zip)
var is: Option[InputStream] = addDatasetInfoToZip(dataFolder, dataset, zip)
//digest input stream
val md5 = MessageDigest.getInstance("MD5")
md5Files.put(dataFolder+"_info.json",md5)
is = Some(new DigestInputStream(is.get,md5))
file_type = 1 //next is metadata


Enumerator.generateM({
is match {
case Some(inputStream) => {
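
The hunk above wraps the dataset-info stream in a `DigestInputStream` so an MD5 accumulates as the zip is streamed, presumably for the BagIt checksum manifests. A self-contained sketch of that pattern:

```scala
import java.io.ByteArrayInputStream
import java.security.{DigestInputStream, MessageDigest}

object DigestSketch extends App {
  val md5 = MessageDigest.getInstance("MD5")
  // Wrapping the stream lets the digest update as bytes are read,
  // so the checksum is ready without a second pass over the data.
  val in = new DigestInputStream(new ByteArrayInputStream("hello".getBytes("UTF-8")), md5)
  val buf = new Array[Byte](8192)
  while (in.read(buf) != -1) () // draining the stream feeds the digest
  in.close()
  println(md5.digest().map("%02x".format(_)).mkString) // 5d41402abc4b2a76b9719d911017c592
}
```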
@@ -2415,7 +2432,7 @@

// Use custom enumerator to create the zip file on the fly
// Use a 1MB in-memory byte array
Ok.chunked(enumeratorFromDataset(dataset,1024*1024, compression,bagit,user)).withHeaders(
Ok.chunked(enumeratorFromDataset(dataset,1024*1024, compression, bagit, user, None, None)).withHeaders(
CONTENT_TYPE -> "application/zip",
CONTENT_DISPOSITION -> (FileUtils.encodeAttachment(dataset.name+ ".zip", request.headers.get("user-agent").getOrElse("")))
)
@@ -2427,6 +2444,62 @@
}
}

// Takes a dataset ID and a comma-separated string of file UUIDs within that dataset, and streams just those files as a zip
def downloadPartial(id: UUID, fileList: String) = PermissionAction(Permission.DownloadFiles, Some(ResourceRef(ResourceRef.dataset, id))) { implicit request =>
implicit val user = request.user
datasets.get(id) match {
case Some(dataset) => {
val fileIDs = fileList.split(',').map(fid => new UUID(fid)).toList
val bagit = play.api.Play.configuration.getBoolean("downloadDatasetBagit").getOrElse(true)

// Increment download count for each file
fileIDs.foreach(fid => files.incrementDownloads(fid, user))

// Use custom enumerator to create the zip file on the fly
// Use a 1MB in-memory byte array
Ok.chunked(enumeratorFromDataset(dataset,1024*1024, -1, bagit, user, Some(fileIDs), None)).withHeaders(
CONTENT_TYPE -> "application/zip",
CONTENT_DISPOSITION -> (FileUtils.encodeAttachment(dataset.name+ " (Partial).zip", request.headers.get("user-agent").getOrElse("")))
)
}
// If the dataset wasn't found by ID
case None => {
NotFound
}
}
}
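
Two details worth noting, shown in a hedged sketch below: the `-1` passed for compression is `java.util.zip.Deflater.DEFAULT_COMPRESSION`, and in Scala/Java `"".split(',')` yields `Array("")`, so an empty or trailing-comma `fileList` would reach `new UUID("")` in the action above. The defensive filtering here is this sketch's own addition, not behavior of the committed code.

```scala
object FileListSketch extends App {
  // Parse a comma-separated fileList, dropping empty tokens.
  def parseFileList(fileList: String): List[String] =
    fileList.split(',').map(_.trim).filter(_.nonEmpty).toList

  println(parseFileList("id1,id2,id3")) // List(id1, id2, id3)
  println(parseFileList("id1,,id2,"))   // List(id1, id2)
  println(parseFileList(""))            // List()
}
```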

// Takes a dataset ID and a folder ID within that dataset, and streams just that folder (including its sub-folders) as a zip
def downloadFolder(id: UUID, folderId: UUID) = PermissionAction(Permission.DownloadFiles, Some(ResourceRef(ResourceRef.dataset, id))) { implicit request =>
implicit val user = request.user
datasets.get(id) match {
case Some(dataset) => {
val bagit = play.api.Play.configuration.getBoolean("downloadDatasetBagit").getOrElse(true)

// Increment download count for each file in folder
folders.get(folderId) match {
case Some(fo) => {
fo.files.foreach(fid => files.incrementDownloads(fid, user))

// Use custom enumerator to create the zip file on the fly
// Use a 1MB in-memory byte array
Ok.chunked(enumeratorFromDataset(dataset,1024*1024, -1, bagit, user, None, Some(folderId))).withHeaders(
CONTENT_TYPE -> "application/zip",
CONTENT_DISPOSITION -> (FileUtils.encodeAttachment(dataset.name+ " ("+fo.name+" Folder).zip", request.headers.get("user-agent").getOrElse("")))
)
}
case None => NotFound
}


}
// If the dataset wasn't found by ID
case None => {
NotFound
}
}
}
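
Per the comment above, the folder download includes sub-folders; an illustrative recursive walk (not Clowder's actual `listFilesInFolder`) shows the intended collection behavior:

```scala
object FolderWalkSketch extends App {
  // Toy folder tree; Clowder's real model types differ.
  case class Folder(name: String, files: List[String], subfolders: List[Folder])

  // Collect every file ID under a folder, depth-first.
  def collectFiles(f: Folder): List[String] =
    f.files ++ f.subfolders.flatMap(collectFiles)

  val tree = Folder("root", List("a"), List(Folder("sub", List("b", "c"), Nil)))
  println(collectFiles(tree)) // List(a, b, c)
}
```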

def updateAccess(id:UUID, access:String) = PermissionAction(Permission.PublicDataset, Some(ResourceRef(ResourceRef.dataset, id))) { implicit request =>
implicit val user = request.user
user match {
27 changes: 7 additions & 20 deletions app/api/Files.scala
@@ -728,42 +728,29 @@ class Files @Inject()(
"content-type" -> file.contentType,
"date-created" -> file.uploadDate.toString(),
"size" -> file.length.toString,
"thumbnail" -> file.thumbnail_id.orNull,
"authorId" -> file.author.id.stringify,
"status" -> file.status)

// Only include storage-location details (filepath for disk storage, or S3 endpoint/bucket/object key) if the user is a serverAdmin
val jsonMap = file.loader match {
case "services.filesystem.DiskByteStorageService" => {
if (serverAdmin)
Map(
"id" -> file.id.toString,
"filename" -> file.filename,
"filepath" -> file.loader_id,
"filedescription" -> file.description,
"content-type" -> file.contentType,
"date-created" -> file.uploadDate.toString(),
"size" -> file.length.toString,
"authorId" -> file.author.id.stringify,
"status" -> file.status)
defaultMap ++ Map(
"filepath" -> file.loader_id
)
else
defaultMap
}
case "services.s3.S3ByteStorageService" => {
if (serverAdmin) {
val bucketName = configuration.getString(S3ByteStorageService.BucketName).getOrElse("")
val serviceEndpoint = configuration.getString(S3ByteStorageService.ServiceEndpoint).getOrElse("")
Map(
"id" -> file.id.toString,
"filename" -> file.filename,
defaultMap ++ Map(
"service-endpoint" -> serviceEndpoint,
"bucket-name" -> bucketName,
"object-key" -> file.loader_id,
"filedescription" -> file.description,
"content-type" -> file.contentType,
"date-created" -> file.uploadDate.toString(),
"size" -> file.length.toString,
"authorId" -> file.author.id.stringify,
"status" -> file.status)
"object-key" -> file.loader_id
)
} else
defaultMap
}
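
The refactor above collapses the duplicated `Map` literals into a shared `defaultMap` extended with backend-specific fields. A sketch of the `++` semantics it relies on (entries from the right-hand operand win on key collision):

```scala
object MapMergeSketch extends App {
  val defaults = Map("id" -> "42", "status" -> "PROCESSED")
  // ++ returns a new immutable Map; "status" is overridden by the right side.
  val merged = defaults ++ Map("filepath" -> "/data/blob", "status" -> "ARCHIVED")
  println(merged("status"))   // ARCHIVED
  println(merged("filepath")) // /data/blob
}
```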
2 changes: 2 additions & 0 deletions app/controllers/Application.scala
@@ -333,6 +333,8 @@ class Application @Inject() (files: FileService, collections: CollectionService,
api.routes.javascript.Datasets.unfollow,
api.routes.javascript.Datasets.detachFile,
api.routes.javascript.Datasets.download,
api.routes.javascript.Datasets.downloadPartial,
api.routes.javascript.Datasets.downloadFolder,
api.routes.javascript.Datasets.getPreviews,
api.routes.javascript.Datasets.updateAccess,
api.routes.javascript.Datasets.addFileEvent,
(The remaining 11 changed files are not shown here.)