<?xml version="1.0" encoding="UTF-8"?>

<!-- Generated by maven-plugin-tools 3.1 on 2013-08-16 -->

<plugin>
  <name>CDK Maven Plugin</name>
  <description>The CDK Maven Plugin provides Maven goals for packaging, deploying, and running distributed applications.</description>
  <groupId>com.cloudera.cdk</groupId>
  <artifactId>cdk-maven-plugin</artifactId>
  <version>0.6.0</version>
  <goalPrefix>cdk</goalPrefix>
  <mojos>
    <mojo>
      <!-- Goal "create-dataset", implemented by CreateDatasetMojo.
           requiresProject is false for this goal. -->
      <goal>create-dataset</goal>
      <description>Create a named dataset whose entries conform to a defined schema.</description>
      <requiresDirectInvocation>false</requiresDirectInvocation>
      <requiresProject>false</requiresProject>
      <requiresReports>false</requiresReports>
      <aggregator>false</aggregator>
      <requiresOnline>false</requiresOnline>
      <inheritedByDefault>true</inheritedByDefault>
      <implementation>com.cloudera.cdk.maven.plugins.CreateDatasetMojo</implementation>
      <language>java</language>
      <instantiationStrategy>per-lookup</instantiationStrategy>
      <executionStrategy>once-per-session</executionStrategy>
      <threadSafe>false</threadSafe>
      <!-- Parameter metadata. Only avroSchemaFile and datasetName are marked required. -->
      <parameters>
        <parameter>
          <name>avroSchemaFile</name>
          <type>java.lang.String</type>
          <required>true</required>
          <editable>true</editable>
          <description>The file containing the Avro schema. If no file with the specified name is found on the local filesystem, then the classpath is searched for a matching resource.</description>
        </parameter>
        <parameter>
          <name>datasetName</name>
          <type>java.lang.String</type>
          <required>true</required>
          <editable>true</editable>
          <description>The name of the dataset to create.</description>
        </parameter>
        <parameter>
          <name>format</name>
          <type>java.lang.String</type>
          <required>false</required>
          <editable>true</editable>
          <description>The file format (avro or parquet).</description>
        </parameter>
        <parameter>
          <name>hadoopConfiguration</name>
          <type>java.util.Properties</type>
          <required>false</required>
          <editable>true</editable>
          <description>Hadoop configuration properties.</description>
        </parameter>
        <parameter>
          <name>hcatalog</name>
          <type>boolean</type>
          <required>false</required>
          <editable>true</editable>
          <description>If true, store dataset metadata in HCatalog, otherwise store it on the filesystem.</description>
        </parameter>
        <parameter>
          <name>partitionExpression</name>
          <type>java.lang.String</type>
          <required>false</required>
          <editable>true</editable>
          <description>The partition expression, in JEXL format (experimental).</description>
        </parameter>
        <parameter>
          <name>rootDirectory</name>
          <type>java.lang.String</type>
          <required>false</required>
          <editable>true</editable>
          <description>The root directory of the dataset repository. Optional if using HCatalog for metadata storage.</description>
        </parameter>
      </parameters>
      <!-- Each parameter is populated from the ${cdk.*} expression of the same name.
           No default-value attributes are declared for this goal. -->
      <configuration>
        <avroSchemaFile implementation="java.lang.String">${cdk.avroSchemaFile}</avroSchemaFile>
        <datasetName implementation="java.lang.String">${cdk.datasetName}</datasetName>
        <format implementation="java.lang.String">${cdk.format}</format>
        <hadoopConfiguration implementation="java.util.Properties">${cdk.hadoopConfiguration}</hadoopConfiguration>
        <hcatalog implementation="boolean">${cdk.hcatalog}</hcatalog>
        <partitionExpression implementation="java.lang.String">${cdk.partitionExpression}</partitionExpression>
        <rootDirectory implementation="java.lang.String">${cdk.rootDirectory}</rootDirectory>
      </configuration>
    </mojo>
    <mojo>
      <!-- Goal "deploy-app", implemented by DeployAppMojo.
           requiresProject is true for this goal. -->
      <goal>deploy-app</goal>
      <description>Deploy a packaged application to a Hadoop filesystem, such as HDFS.</description>
      <requiresDirectInvocation>false</requiresDirectInvocation>
      <requiresProject>true</requiresProject>
      <requiresReports>false</requiresReports>
      <aggregator>false</aggregator>
      <requiresOnline>false</requiresOnline>
      <inheritedByDefault>true</inheritedByDefault>
      <implementation>com.cloudera.cdk.maven.plugins.DeployAppMojo</implementation>
      <language>java</language>
      <instantiationStrategy>per-lookup</instantiationStrategy>
      <executionStrategy>once-per-session</executionStrategy>
      <threadSafe>false</threadSafe>
      <!-- Parameter metadata. deployFileSystem is the only parameter marked required. -->
      <parameters>
        <parameter>
          <name>applicationName</name>
          <type>java.lang.String</type>
          <required>false</required>
          <editable>true</editable>
          <description>The name of the application.</description>
        </parameter>
        <parameter>
          <name>applicationsDirectory</name>
          <type>java.lang.String</type>
          <required>false</required>
          <editable>true</editable>
          <description>The base directory in the Hadoop filesystem (typically HDFS) where applications are stored.</description>
        </parameter>
        <parameter>
          <name>deployFileSystem</name>
          <type>java.lang.String</type>
          <required>true</required>
          <editable>true</editable>
          <description>The Hadoop filesystem used to deploy the application. The filesystem must be accessible by the client deploying the application.</description>
        </parameter>
        <parameter>
          <name>localApplicationFile</name>
          <type>java.io.File</type>
          <required>false</required>
          <editable>true</editable>
          <description>The local directory of the application to deploy.</description>
        </parameter>
        <parameter>
          <name>updateApplication</name>
          <type>boolean</type>
          <required>false</required>
          <editable>true</editable>
          <description>Whether to automatically undeploy applications that already exist when deploying. If false, and this application has already been deployed, then an error will be reported.</description>
        </parameter>
      </parameters>
      <!-- Each parameter is populated from the ${cdk.*} expression of the same name.
           Every parameter except deployFileSystem also declares a default-value. -->
      <configuration>
        <applicationName implementation="java.lang.String" default-value="${project.build.finalName}-app">${cdk.applicationName}</applicationName>
        <applicationsDirectory implementation="java.lang.String" default-value="/user/${user.name}/apps/">${cdk.applicationsDirectory}</applicationsDirectory>
        <deployFileSystem implementation="java.lang.String">${cdk.deployFileSystem}</deployFileSystem>
        <localApplicationFile implementation="java.io.File" default-value="${project.build.directory}/${project.build.finalName}-app">${cdk.localApplicationFile}</localApplicationFile>
        <updateApplication implementation="boolean" default-value="false">${cdk.updateApplication}</updateApplication>
      </configuration>
    </mojo>
    <mojo>
      <!-- Goal "drop-dataset", implemented by DropDatasetMojo.
           requiresProject is false for this goal. -->
      <goal>drop-dataset</goal>
      <description>Delete a dataset and its metadata.</description>
      <requiresDirectInvocation>false</requiresDirectInvocation>
      <requiresProject>false</requiresProject>
      <requiresReports>false</requiresReports>
      <aggregator>false</aggregator>
      <requiresOnline>false</requiresOnline>
      <inheritedByDefault>true</inheritedByDefault>
      <implementation>com.cloudera.cdk.maven.plugins.DropDatasetMojo</implementation>
      <language>java</language>
      <instantiationStrategy>per-lookup</instantiationStrategy>
      <executionStrategy>once-per-session</executionStrategy>
      <threadSafe>false</threadSafe>
      <!-- Parameter metadata. datasetName is the only parameter marked required. -->
      <parameters>
        <parameter>
          <name>datasetName</name>
          <type>java.lang.String</type>
          <required>true</required>
          <editable>true</editable>
          <description>The name of the dataset to drop.</description>
        </parameter>
        <parameter>
          <name>hadoopConfiguration</name>
          <type>java.util.Properties</type>
          <required>false</required>
          <editable>true</editable>
          <description>Hadoop configuration properties.</description>
        </parameter>
        <parameter>
          <name>hcatalog</name>
          <type>boolean</type>
          <required>false</required>
          <editable>true</editable>
          <description>If true, store dataset metadata in HCatalog, otherwise store it on the filesystem.</description>
        </parameter>
        <parameter>
          <name>rootDirectory</name>
          <type>java.lang.String</type>
          <required>false</required>
          <editable>true</editable>
          <description>The root directory of the dataset repository. Optional if using HCatalog for metadata storage.</description>
        </parameter>
      </parameters>
      <!-- Each parameter is populated from the ${cdk.*} expression of the same name.
           No default-value attributes are declared for this goal. -->
      <configuration>
        <datasetName implementation="java.lang.String">${cdk.datasetName}</datasetName>
        <hadoopConfiguration implementation="java.util.Properties">${cdk.hadoopConfiguration}</hadoopConfiguration>
        <hcatalog implementation="boolean">${cdk.hcatalog}</hcatalog>
        <rootDirectory implementation="java.lang.String">${cdk.rootDirectory}</rootDirectory>
      </configuration>
    </mojo>
    <mojo>
      <!-- Goal "package-app", implemented by PackageAppMojo.
           Declares phase "package", requiresProject true, and runtime-scope
           dependency resolution. -->
      <goal>package-app</goal>
      <description>Package an application on the local filesystem.</description>
      <requiresDependencyResolution>runtime</requiresDependencyResolution>
      <requiresDirectInvocation>false</requiresDirectInvocation>
      <requiresProject>true</requiresProject>
      <requiresReports>false</requiresReports>
      <aggregator>false</aggregator>
      <requiresOnline>false</requiresOnline>
      <inheritedByDefault>true</inheritedByDefault>
      <phase>package</phase>
      <implementation>com.cloudera.cdk.maven.plugins.PackageAppMojo</implementation>
      <language>java</language>
      <instantiationStrategy>per-lookup</instantiationStrategy>
      <executionStrategy>once-per-session</executionStrategy>
      <threadSafe>false</threadSafe>
      <!-- Parameter metadata. toolClass is the only parameter marked required. -->
      <parameters>
        <parameter>
          <name>addDependenciesToDistributedCache</name>
          <type>boolean</type>
          <required>false</required>
          <editable>true</editable>
          <description>Whether to add dependencies in the runtime classpath to Hadoop&apos;s distributed cache so that they are added to the classpath for MapReduce tasks (via -libjars).</description>
        </parameter>
        <parameter>
          <name>applicationName</name>
          <type>java.lang.String</type>
          <required>false</required>
          <editable>true</editable>
          <description>The name of the application.</description>
        </parameter>
        <parameter>
          <name>applicationsDirectory</name>
          <type>java.lang.String</type>
          <required>false</required>
          <editable>true</editable>
          <description>The base directory in the Hadoop filesystem (typically HDFS) where applications are stored.</description>
        </parameter>
        <!-- NOTE(review): the type name is written "coordinator" to agree with the
             coordinatorFile description below; confirm against the mojo source. -->
        <parameter>
          <name>applicationType</name>
          <type>java.lang.String</type>
          <required>false</required>
          <editable>true</editable>
          <description>The type of the application (workflow, coordinator, or bundle).</description>
        </parameter>
        <parameter>
          <name>args</name>
          <type>java.lang.String[]</type>
          <required>false</required>
          <editable>true</editable>
          <description>Arguments to pass to the tool, in addition to those generated by addDependenciesToDistributedCache and hadoopConfiguration.</description>
        </parameter>
        <parameter>
          <name>coordinatorFile</name>
          <type>java.io.File</type>
          <required>false</required>
          <editable>true</editable>
          <description>The coordinator.xml file to use (only for applications of type coordinator).</description>
        </parameter>
        <parameter>
          <name>encoding</name>
          <type>java.lang.String</type>
          <required>false</required>
          <editable>true</editable>
          <description>Character encoding for the auto-generated workflow file.</description>
        </parameter>
        <parameter>
          <name>generateWorkflowXml</name>
          <type>boolean</type>
          <required>false</required>
          <editable>true</editable>
          <description>Whether the workflow.xml should be generated or not.</description>
        </parameter>
        <parameter>
          <name>hadoopConfiguration</name>
          <type>java.util.Properties</type>
          <required>false</required>
          <editable>true</editable>
          <description>Hadoop configuration properties.</description>
        </parameter>
        <parameter>
          <name>schemaVersion</name>
          <type>java.lang.String</type>
          <required>false</required>
          <editable>true</editable>
          <description>The version of the Oozie workflow schema.</description>
        </parameter>
        <parameter>
          <name>toolClass</name>
          <type>java.lang.String</type>
          <required>true</required>
          <editable>true</editable>
          <description>The tool class to run. The specified class must have a standard Java main method.</description>
        </parameter>
        <parameter>
          <name>workflowName</name>
          <type>java.lang.String</type>
          <required>false</required>
          <editable>true</editable>
          <description>The name of the workflow.</description>
        </parameter>
      </parameters>
      <!-- Parameters are populated from ${cdk.*} expressions. Note that "encoding"
           reads ${cdk.workflowFileEncoding}, not ${cdk.encoding}; all others use
           the expression matching their own name. -->
      <configuration>
        <addDependenciesToDistributedCache implementation="boolean" default-value="true">${cdk.addDependenciesToDistributedCache}</addDependenciesToDistributedCache>
        <applicationName implementation="java.lang.String" default-value="${project.build.finalName}-app">${cdk.applicationName}</applicationName>
        <applicationsDirectory implementation="java.lang.String" default-value="/user/${user.name}/apps/">${cdk.applicationsDirectory}</applicationsDirectory>
        <applicationType implementation="java.lang.String" default-value="workflow">${cdk.applicationType}</applicationType>
        <args implementation="java.lang.String[]">${cdk.args}</args>
        <coordinatorFile implementation="java.io.File" default-value="${basedir}/src/main/oozie/coordinator.xml">${cdk.coordinatorFile}</coordinatorFile>
        <encoding implementation="java.lang.String" default-value="UTF-8">${cdk.workflowFileEncoding}</encoding>
        <generateWorkflowXml implementation="boolean" default-value="true">${cdk.generateWorkflowXml}</generateWorkflowXml>
        <hadoopConfiguration implementation="java.util.Properties">${cdk.hadoopConfiguration}</hadoopConfiguration>
        <schemaVersion implementation="java.lang.String" default-value="0.4">${cdk.schemaVersion}</schemaVersion>
        <toolClass implementation="java.lang.String">${cdk.toolClass}</toolClass>
        <workflowName implementation="java.lang.String" default-value="${project.build.finalName}">${cdk.workflowName}</workflowName>
      </configuration>
    </mojo>
    <mojo>
      <!-- Goal "run-app", implemented by RunAppMojo.
           requiresProject is true for this goal. -->
      <goal>run-app</goal>
      <description>Run an app as a job on a cluster.</description>
      <requiresDirectInvocation>false</requiresDirectInvocation>
      <requiresProject>true</requiresProject>
      <requiresReports>false</requiresReports>
      <aggregator>false</aggregator>
      <requiresOnline>false</requiresOnline>
      <inheritedByDefault>true</inheritedByDefault>
      <implementation>com.cloudera.cdk.maven.plugins.RunAppMojo</implementation>
      <language>java</language>
      <instantiationStrategy>per-lookup</instantiationStrategy>
      <executionStrategy>once-per-session</executionStrategy>
      <threadSafe>false</threadSafe>
      <!-- Parameter metadata. oozieUrl is the only parameter marked required. -->
      <parameters>
        <parameter>
          <name>applicationName</name>
          <type>java.lang.String</type>
          <required>false</required>
          <editable>true</editable>
          <description>The name of the application.</description>
        </parameter>
        <parameter>
          <name>applicationsDirectory</name>
          <type>java.lang.String</type>
          <required>false</required>
          <editable>true</editable>
          <description>The base directory in the Hadoop filesystem (typically HDFS) where applications are stored.</description>
        </parameter>
        <!-- NOTE(review): the type name is written "coordinator" rather than
             "coordination"; confirm the accepted value against the mojo source. -->
        <parameter>
          <name>applicationType</name>
          <type>java.lang.String</type>
          <required>false</required>
          <editable>true</editable>
          <description>The type of the application (workflow, coordinator, or bundle).</description>
        </parameter>
        <parameter>
          <name>hadoopConfiguration</name>
          <type>java.util.Properties</type>
          <required>false</required>
          <editable>true</editable>
          <description>Hadoop configuration properties.</description>
        </parameter>
        <parameter>
          <name>jobProperties</name>
          <type>java.util.Properties</type>
          <required>false</required>
          <editable>true</editable>
          <description>Job configuration properties for the application. This provides a means to specify values for parameterized properties in Oozie applications.</description>
        </parameter>
        <parameter>
          <name>oozieUrl</name>
          <type>java.lang.String</type>
          <required>true</required>
          <editable>true</editable>
          <description>The URL of the Oozie service to use.</description>
        </parameter>
      </parameters>
      <!-- Each parameter is populated from the ${cdk.*} expression of the same name.
           applicationName, applicationsDirectory and applicationType also declare
           a default-value. -->
      <configuration>
        <applicationName implementation="java.lang.String" default-value="${project.build.finalName}-app">${cdk.applicationName}</applicationName>
        <applicationsDirectory implementation="java.lang.String" default-value="/user/${user.name}/apps/">${cdk.applicationsDirectory}</applicationsDirectory>
        <applicationType implementation="java.lang.String" default-value="workflow">${cdk.applicationType}</applicationType>
        <hadoopConfiguration implementation="java.util.Properties">${cdk.hadoopConfiguration}</hadoopConfiguration>
        <jobProperties implementation="java.util.Properties">${cdk.jobProperties}</jobProperties>
        <oozieUrl implementation="java.lang.String">${cdk.oozieUrl}</oozieUrl>
      </configuration>
    </mojo>
    <mojo>
      <!-- Goal "run-tool", implemented by RunToolMojo.
           Declares requiresProject true and runtime-scope dependency resolution. -->
      <goal>run-tool</goal>
      <description>Run a Hadoop tool on the local machine.</description>
      <requiresDependencyResolution>runtime</requiresDependencyResolution>
      <requiresDirectInvocation>false</requiresDirectInvocation>
      <requiresProject>true</requiresProject>
      <requiresReports>false</requiresReports>
      <aggregator>false</aggregator>
      <requiresOnline>false</requiresOnline>
      <inheritedByDefault>true</inheritedByDefault>
      <implementation>com.cloudera.cdk.maven.plugins.RunToolMojo</implementation>
      <language>java</language>
      <instantiationStrategy>per-lookup</instantiationStrategy>
      <executionStrategy>once-per-session</executionStrategy>
      <threadSafe>false</threadSafe>
      <!-- Parameter metadata. toolClass is the only parameter marked required. -->
      <parameters>
        <parameter>
          <name>addDependenciesToDistributedCache</name>
          <type>boolean</type>
          <required>false</required>
          <editable>true</editable>
          <description>Whether to add dependencies in the runtime classpath to Hadoop&apos;s distributed cache so that they are added to the classpath for MapReduce tasks (via -libjars).</description>
        </parameter>
        <parameter>
          <name>args</name>
          <type>java.lang.String[]</type>
          <required>false</required>
          <editable>true</editable>
          <description>Arguments to pass to the tool, in addition to those generated by addDependenciesToDistributedCache and hadoopConfiguration.</description>
        </parameter>
        <parameter>
          <name>hadoopConfiguration</name>
          <type>java.util.Properties</type>
          <required>false</required>
          <editable>true</editable>
          <description>Hadoop configuration properties.</description>
        </parameter>
        <parameter>
          <name>toolClass</name>
          <type>java.lang.String</type>
          <required>true</required>
          <editable>true</editable>
          <description>The tool class to run. The specified class must have a standard Java main method.</description>
        </parameter>
      </parameters>
      <!-- Each parameter is populated from the ${cdk.*} expression of the same name.
           Only addDependenciesToDistributedCache declares a default-value (true). -->
      <configuration>
        <addDependenciesToDistributedCache implementation="boolean" default-value="true">${cdk.addDependenciesToDistributedCache}</addDependenciesToDistributedCache>
        <args implementation="java.lang.String[]">${cdk.args}</args>
        <hadoopConfiguration implementation="java.util.Properties">${cdk.hadoopConfiguration}</hadoopConfiguration>
        <toolClass implementation="java.lang.String">${cdk.toolClass}</toolClass>
      </configuration>
    </mojo>
  </mojos>
</plugin>