#!/bin/sh # Licensed to the Apache Software Foundation (ASF) under one # or more contributor license agreements. See the NOTICE file # distributed with this work for additional information # regarding copyright ownership. The ASF licenses this file # to you under the Apache License, Version 2.0 (the # "License"); you may not use this file except in compliance # with the License. You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. cwd=`dirname $0` ARCHIVES=`ls -1 $cwd/../../../build/apache-cassandra*.jar` for jar in `ls -1 $cwd/../../../build/lib/jars/*.jar $cwd/../../../lib/*.jar`; do ARCHIVES=$ARCHIVES,$jar done hadoop jar $cwd/../../../build/lib/jars/hadoop-streaming*.jar \ -D stream.reduce.output=cassandra_avro_output \ -D stream.io.identifier.resolver.class=org.apache.cassandra.hadoop.streaming.AvroResolver \ -D cassandra.output.keyspace=Keyspace1 \ -D cassandra.output.columnfamily=Standard1 \ -D cassandra.partitioner.class=org.apache.cassandra.dht.RandomPartitioner \ -D cassandra.thrift.address=127.0.0.1 \ -D cassandra.thrift.port=9160 \ -libjars $ARCHIVES \ -file $cwd/../../../interface/avro/cassandra.avpr \ -outputformat org.apache.cassandra.hadoop.ColumnFamilyOutputFormat \ -output /tmp/ignored \ -mapper $cwd/mapper.py -reducer $cwd/reducer.py \ $*