LISTSERV mailing list manager LISTSERV 16.5

Help for HPS-SVN Archives


HPS-SVN Archives

HPS-SVN Archives


HPS-SVN@LISTSERV.SLAC.STANFORD.EDU


View:

Message:

[

First

|

Previous

|

Next

|

Last

]

By Topic:

[

First

|

Previous

|

Next

|

Last

]

By Author:

[

First

|

Previous

|

Next

|

Last

]

Font:

Proportional Font

LISTSERV Archives

LISTSERV Archives

HPS-SVN Home

HPS-SVN Home

HPS-SVN January 2016

HPS-SVN January 2016

Subject:

r4078 - in /java/branches/jeremy-dev/crawler/src/main/java/org/hps/crawler: CrawlerFileVisitor.java DataType.java DatacatCrawler.java DatacatHelper.java

From:

[log in to unmask]

Reply-To:

Notification of commits to the hps svn repository <[log in to unmask]>

Date:

Mon, 4 Jan 2016 18:56:45 -0000

Content-Type:

text/plain

Parts/Attachments:

Parts/Attachments

text/plain (232 lines)

Author: [log in to unmask]
Date: Mon Jan  4 10:56:39 2016
New Revision: 4078

Log:
Cleanup building of new dataset; other minor changes.

Modified:
    java/branches/jeremy-dev/crawler/src/main/java/org/hps/crawler/CrawlerFileVisitor.java
    java/branches/jeremy-dev/crawler/src/main/java/org/hps/crawler/DataType.java
    java/branches/jeremy-dev/crawler/src/main/java/org/hps/crawler/DatacatCrawler.java
    java/branches/jeremy-dev/crawler/src/main/java/org/hps/crawler/DatacatHelper.java

Modified: java/branches/jeremy-dev/crawler/src/main/java/org/hps/crawler/CrawlerFileVisitor.java
 =============================================================================
--- java/branches/jeremy-dev/crawler/src/main/java/org/hps/crawler/CrawlerFileVisitor.java	(original)
+++ java/branches/jeremy-dev/crawler/src/main/java/org/hps/crawler/CrawlerFileVisitor.java	Mon Jan  4 10:56:39 2016
@@ -10,7 +10,7 @@
 import java.util.List;
 
 /**
- * Visitor which creates a {@link FileSet} from walking a directory tree.
+ * Visitor which creates a list of files from walking a directory tree.
  * <p>
  * Any number of {@link java.io.FileFilter} objects can be registered with this visitor to restrict which files are
  * accepted.
@@ -20,12 +20,12 @@
 final class CrawlerFileVisitor extends SimpleFileVisitor<Path> {
 
     /**
-     * The run log containing information about files from each run.
+     * The list of files found from crawling.
      */
     private final List<File> files = new ArrayList<File>();
 
     /**
-     * A list of file filters to apply.
+     * A list of file filters applied to each path.
      */
     private final List<FileFilter> filters = new ArrayList<FileFilter>();
 

Modified: java/branches/jeremy-dev/crawler/src/main/java/org/hps/crawler/DataType.java
 =============================================================================
--- java/branches/jeremy-dev/crawler/src/main/java/org/hps/crawler/DataType.java	(original)
+++ java/branches/jeremy-dev/crawler/src/main/java/org/hps/crawler/DataType.java	Mon Jan  4 10:56:39 2016
@@ -7,7 +7,7 @@
  */
 public enum DataType {
     /**
-     * Data quality management plots.
+     * Data quality management plots (AIDA or ROOT).
      */
     DQM,
     /**
@@ -15,7 +15,7 @@
      */
     RAW,
     /**
-     * Reconstructed data (usually LCIO).
+     * Reconstructed data (LCIO).
      */
     RECON,
     /**

Modified: java/branches/jeremy-dev/crawler/src/main/java/org/hps/crawler/DatacatCrawler.java
 =============================================================================
--- java/branches/jeremy-dev/crawler/src/main/java/org/hps/crawler/DatacatCrawler.java	(original)
+++ java/branches/jeremy-dev/crawler/src/main/java/org/hps/crawler/DatacatCrawler.java	Mon Jan  4 10:56:39 2016
@@ -2,7 +2,6 @@
 
 import java.io.File;
 import java.io.IOException;
-import java.net.URISyntaxException;
 import java.nio.file.FileVisitOption;
 import java.nio.file.Files;
 import java.nio.file.attribute.BasicFileAttributes;
@@ -19,8 +18,6 @@
 import org.apache.commons.cli.HelpFormatter;
 import org.apache.commons.cli.Options;
 import org.apache.commons.cli.ParseException;
-import org.srs.datacat.client.Client;
-import org.srs.datacat.client.ClientBuilder;
 import org.srs.datacat.model.DatasetModel;
 
 /**
@@ -57,7 +54,6 @@
      * Statically define the command options.
      */
     static {
-        OPTIONS.addOption("L", "log-level", true, "set the log level (INFO, FINE, etc.)");
         OPTIONS.addOption("b", "min-date", true, "min date for a file (example \"2015-03-26 11:28:59\")");
         OPTIONS.addOption("d", "directory", true, "root directory to crawl");
         OPTIONS.addOption("f", "folder", true, "datacat folder");
@@ -108,13 +104,6 @@
             // Print help.
             if (cl.hasOption("h") || args.length == 0) {
                 this.printUsage();
-            }
-
-            // Log level (only used for this class's logger).
-            if (cl.hasOption("L")) {
-                final Level level = Level.parse(cl.getOptionValue("L"));
-                LOGGER.config("log level " + level);
-                LOGGER.setLevel(level);
             }
 
             // Root directory for file crawling.
@@ -217,6 +206,18 @@
                 }
                 config.setAcceptRuns(acceptRuns);
             }
+                                    
+            // Dry run.
+            if (cl.hasOption("D")) {
+                config.setDryRun(true);
+            }
+                        
+            // List of paths.
+            if (!cl.getArgList().isEmpty()) {
+                for (String arg : cl.getArgList()) {
+                    config.addPath(arg);
+                }
+            }
             
             // Dataset site (defaults to JLAB).
             Site site = Site.JLAB;
@@ -226,22 +227,10 @@
             LOGGER.config("dataset site " + site);
             config.setSite(site);
             
-            // Dry run.
-            if (cl.hasOption("D")) {
-                config.setDryRun(true);
-            }
-            
             // Data catalog URL.
             if (cl.hasOption("u")) {
                 config.setDatacatUrl(cl.getOptionValue("u"));
                 LOGGER.config("datacat URL " + config.datacatUrl());
-            }
-            
-            // List of paths.
-            if (!cl.getArgList().isEmpty()) {
-                for (String arg : cl.getArgList()) {
-                    config.addPath(arg);
-                }
             }
 
         } catch (final ParseException e) {

Modified: java/branches/jeremy-dev/crawler/src/main/java/org/hps/crawler/DatacatHelper.java
 =============================================================================
--- java/branches/jeremy-dev/crawler/src/main/java/org/hps/crawler/DatacatHelper.java	(original)
+++ java/branches/jeremy-dev/crawler/src/main/java/org/hps/crawler/DatacatHelper.java	Mon Jan  4 10:56:39 2016
@@ -14,6 +14,7 @@
 import org.srs.datacat.client.Client;
 import org.srs.datacat.client.ClientBuilder;
 import org.srs.datacat.model.DatasetModel;
+import org.srs.datacat.model.DatasetView.VersionId;
 import org.srs.datacat.shared.Dataset;
 import org.srs.datacat.shared.Provider;
 
@@ -183,27 +184,37 @@
             String dataType,
             String fileFormat) {
         
-        Provider provider = new Provider();        
-        List<DatasetModel> datasets = new ArrayList<DatasetModel>();
-                              
+        Provider provider = new Provider();                                              
         Dataset.Builder datasetBuilder = provider.getDatasetBuilder();
-        datasetBuilder.versionId(1);
-        datasetBuilder.master(true);
-        datasetBuilder.name(file.getName());
-        datasetBuilder.resource(file.getPath());
-        datasetBuilder.size((Long) metadata.get("size"));
-        datasetBuilder.scanStatus("OK");
-        datasetBuilder.dataType(dataType);
-        datasetBuilder.fileFormat(fileFormat);
-        datasetBuilder.site(site);
+        
+        // Set basic info on new dataset.
+        datasetBuilder.versionId(VersionId.valueOf("new"))
+            .master(true)
+            .name(file.getName())
+            .resource(file.getPath())
+            .dataType(dataType)
+            .fileFormat(fileFormat)
+            .site(site)
+            .scanStatus("OK");
+        
+        // Set system metadata from the provided metadata map.
         if (metadata.get("eventCount") != null) {
             datasetBuilder.eventCount((Long) metadata.get("eventCount"));
         }
-        datasetBuilder.runMin((Long) metadata.get("runMin"));
-        datasetBuilder.runMax((Long) metadata.get("runMax"));
-        datasetBuilder.checksum((String) metadata.get("checksum"));
-                        
-        // Create user metadata leaving out system metadata fields.
+        if (metadata.get("checksum") != null) {
+            datasetBuilder.checksum((String) metadata.get("checksum"));
+        }
+        if (metadata.get("runMin") != null) {                   
+            datasetBuilder.runMin((Long) metadata.get("runMin"));
+        }
+        if (metadata.get("runMax") != null) {
+            datasetBuilder.runMax((Long) metadata.get("runMax"));
+        }
+        if (metadata.get("size") != null) {
+            datasetBuilder.size((Long) metadata.get("size"));
+        }
+                                
+        // Create user metadata, leaving out system metadata fields.
         Map<String, Object> userMetadata = new HashMap<String, Object>();
         for (Entry<String, Object> metadataEntry : metadata.entrySet()) {
             if (!SYSTEM_METADATA.contains(metadataEntry.getKey())) {
@@ -212,11 +223,7 @@
         }
         datasetBuilder.versionMetadata(userMetadata);
         
-        // Build dataset and add to list.
-        DatasetModel dataset = datasetBuilder.build();
-        datasets.add(dataset);
-        
-        return dataset;
+        return datasetBuilder.build();
     }
     
     /**

Top of Message | Previous Page | Permalink

Advanced Options


Options

Log In

Log In

Get Password

Get Password


Search Archives

Search Archives


Subscribe or Unsubscribe

Subscribe or Unsubscribe


Archives

November 2017
August 2017
July 2017
January 2017
December 2016
November 2016
October 2016
September 2016
August 2016
July 2016
June 2016
May 2016
April 2016
March 2016
February 2016
January 2016
December 2015
November 2015
October 2015
September 2015
August 2015
July 2015
June 2015
May 2015
April 2015
March 2015
February 2015
January 2015
December 2014
November 2014
October 2014
September 2014
August 2014
July 2014
June 2014
May 2014
April 2014
March 2014
February 2014
January 2014
December 2013
November 2013

ATOM RSS1 RSS2



LISTSERV.SLAC.STANFORD.EDU

Secured by F-Secure Anti-Virus CataList Email List Search Powered by the LISTSERV Email List Manager

Privacy Notice, Security Notice and Terms of Use