
Commit c838a6f

Merge pull request #2 from ihelmke/master
Cloud/EC2 Changes
2 parents: d8c5f8a + c3bc77d


5 files changed: +132 −0 lines


deploy/setup.sh

+9
@@ -0,0 +1,9 @@
# install the pipeline's native libraries into Hadoop's lib dir
sudo apt-get install unzip
sudo unzip -n -qq sleuthkit-pipeline-1-SNAPSHOT-libs.zip -d /usr/lib/hadoop/lib/

# restart all Hadoop services so they pick up the new libraries
for SERVICE in /etc/init.d/hadoop*
do
  sudo $SERVICE restart
done

# expose fsrip and its dependencies in the login environment
echo "export LD_LIBRARY_PATH=$HOME/txpete/fsrip/deps/" >> $HOME/.bashrc
echo "export PATH=$PATH:$HOME/txpete/fsrip/" >> $HOME/.bashrc
echo "export HADOOP_HOME=/usr/lib/hadoop/" >> $HOME/.bashrc

deploy/tpkickoff.sh

+54
@@ -0,0 +1,54 @@
#!/bin/sh

if [ $# -ne 3 ] && [ $# -ne 4 ]
then
  echo "Usage: tpkickoff.sh image_friendly_name image_path jar_dir [image_id]"
  exit 1
fi

if [ $# -eq 4 ]
then
  if [ ${#4} -ne 32 ]
  then
    echo "Invalid Image ID: Must be 32 digits long"
    exit 1
  fi
fi

pwd
date

FriendlyName=$1
ImagePath=$2
JarDir=$3

# use the newest pipeline job jar found in the jar directory
JarFile=`ls $JarDir/sleuthkit-pipeline-r*-job.jar | sort | tail -n 1`

JsonFile=$FriendlyName.json
HdfsImage=$FriendlyName.dd

echo "jar file is ${JarFile}"

# rip filesystem metadata, upload to hdfs
fsrip dumpfs $ImagePath | $HADOOP_HOME/bin/hadoop jar $JarFile com.lightboxtechnologies.spectrum.Uploader $JsonFile

# upload image to hdfs
ImageID=`cat $ImagePath | $HADOOP_HOME/bin/hadoop jar $JarFile com.lightboxtechnologies.spectrum.Uploader $HdfsImage`
echo "done uploading"
if [ $# -eq 4 ]
then
  ImageID=$4
fi
echo "Image ID is ${ImageID}"

# kick off ingest
$HADOOP_HOME/bin/hadoop jar $JarFile org.sleuthkit.hadoop.pipeline.Ingest $ImageID $HdfsImage $JsonFile $FriendlyName
echo "done with ingest"

# copy reports template
$HADOOP_HOME/bin/hadoop fs -cp /texaspete/templates/reports /texaspete/data/$ImageID/

# kick off pipeline
$HADOOP_HOME/bin/hadoop jar $JarFile org.sleuthkit.hadoop.pipeline.Pipeline $ImageID $FriendlyName

date
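A hypothetical invocation; the image path and jar directory below are illustrative, and the optional fourth argument is a 32-character image ID (omit it to use the ID returned by the Uploader):

./tpkickoff.sh case1 /evidence/case1.dd ~/txpete
./tpkickoff.sh case1 /evidence/case1.dd ~/txpete 0123456789abcdef0123456789abcdef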

pipeline/pom.xml

+7
@@ -89,6 +89,13 @@
  <profiles>
    <profile>
      <id>dependency-package</id>
      <!-- If you need the zip file with the dependencies of this project built
           along with the project, uncomment the next block of code. -->
      <!--
      <activation>
        <activeByDefault>true</activeByDefault>
      </activation>
      -->
      <build>
        <plugins>
          <plugin>
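If you prefer not to uncomment the activation block, the same profile can normally be selected per build from the command line (standard Maven profile selection, not something this commit adds):

mvn package -P dependency-package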

pushtocluster.sh

+5
@@ -0,0 +1,5 @@
for addr in "$@"
do
  scp -r txpete/ $addr:~
  ssh $addr "cd ~/txpete/; ./setup.sh"
done
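A usage sketch with illustrative host names; each argument is an ssh/scp destination for a cluster node, run from the directory that contains the txpete/ bundle:

./pushtocluster.sh ubuntu@ec2-node-1 ubuntu@ec2-node-2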

whirr-ec2-framework.properties

+57
@@ -0,0 +1,57 @@
#
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

#
# HBase CDH install
#

whirr.cluster-name=hadoop_framework

whirr.instance-templates=1 zookeeper+hadoop-namenode+hadoop-jobtracker+hbase-master,1 hadoop-datanode+hadoop-tasktracker+hbase-regionserver

# replication level should not be higher than number of data nodes
hbase-site.dfs.replication=1

# custom CDH zookeeper install and configure functions
whirr.zookeeper.install-function=install_cdh_zookeeper
whirr.zookeeper.configure-function=configure_cdh_zookeeper

# custom CDH hadoop install and configure functions
whirr.hadoop.install-function=install_cdh_hadoop
whirr.hadoop.configure-function=configure_cdh_hadoop

# custom CDH hbase install and configure functions
whirr.hbase.install-function=install_cdh_hbase
whirr.hbase.configure-function=configure_cdh_hbase

whirr.provider=aws-ec2

whirr.identity=<EC2_IDENTITY>
whirr.credential=<EC2_CREDENTIAL>

# The size of the instance to use. See http://aws.amazon.com/ec2/instance-types/
whirr.hardware-id=c1.xlarge

# Ubuntu 10.04 LTS Lucid. See http://cloud.ubuntu.com/ami/
whirr.image-id=us-east-1/ami-04c9306d

# If you choose a different location, make sure whirr.image-id is updated too
whirr.location-id=us-east-1

# By default use the user system SSH keys. Override them here.
whirr.private-key-file=${sys:user.home}/.ssh/id_rsa
whirr.public-key-file=${sys:user.home}/.ssh/id_rsa.pub
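A hedged launch sketch, assuming the Apache Whirr CLI is installed and the <EC2_IDENTITY>/<EC2_CREDENTIAL> placeholders above have been filled in with real AWS credentials:

whirr launch-cluster --config whirr-ec2-framework.properties
# tear the cluster down when finished
whirr destroy-cluster --config whirr-ec2-framework.properties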
