Code Monkey home page Code Monkey logo

apptrans's Introduction

#Run Book

#Build mvn clean package

#Upload to cluster scp target/AppTrans.jar [email protected]:./

#Log into Cluster ssh [email protected]

#Set up Kafka Topic kafka-topics --zookeeper ted-training-1-1.vpc.cloudera.com:2181
--partitions 2 --replication-factor 2 --create --topic app-event-input

#Running the generator java -cp AppTrans.jar com.cloudera.sa.apptrans.generator.AppEventProducer
ted-training-1-4.vpc.cloudera.com:9092,ted-training-1-5.vpc.cloudera.com:9092
app-event-input 100 0 5 async 1000 10000 20000 ./data/uber_bay_area_lat_lon.csv 1000

#Listen to Kafka with Console kafka-topics --zookeeper ted-training-1-1.vpc.cloudera.com:2181 --list

kafka-console-producer --broker-list
ted-training-1-4.vpc.cloudera.com:9092,ted-training-1-5.vpc.cloudera.com:9092
--topic app-event-input

kafka-console-consumer
--zookeeper ted-training-1-1.vpc.cloudera.com:2181
--topic app-event-input

#Set up Kudu Tables Run these in HUE in the impala window

kudu/apptrans/createAccountMart.sql

kudu/apptrans/createAppEvent.sql

#Set up SolR Collection solrctl instancedir --generate app-event-collection

switch out the schema.xml with the following file app-event-collection/conf/schema.xml

solrctl instancedir --create app-event-collection app-event-collection

solrctl collection --create app-event-collection -s 3 -r 2 -m 3

#Set up HBase Table hadoop jar AppTrans.jar com.cloudera.sa.apptrans.setup.hbase.CreateSaltedTable app-event f 6 6 /opt/cloudera/parcels/CDH/lib/hbase/conf/

hadoop jar AppTrans.jar com.cloudera.sa.apptrans.setup.hbase.CreateSaltedTable account-mart f 6 6 /opt/cloudera/parcels/CDH/lib/hbase/conf/

#Spark Streaming to SolR ##Run Spark to SolR export JAVA_HOME=/opt/jdk1.8.0_91/

spark-submit --class com.cloudera.sa.apptrans.streaming.ingestion.solr.SparkStreamingAppEventToSolR
--master yarn --deploy-mode client --executor-memory 512MB --num-executors 2 --executor-cores 1
AppTrans.jar
ted-training-1-4.vpc.cloudera.com:9092,ted-training-1-5.vpc.cloudera.com:9092
app-event-input
tmp/checkpoint
1
c
app-event-collection
ted-training-1-1.vpc.cloudera.com:2181/solr

##Test SolR input Go to the Hue Dashboard Page

#Spark Streaming to Kudu ##Run Spark to Kudu export JAVA_HOME=/opt/jdk1.8.0_91/

spark-submit --class com.cloudera.sa.apptrans.streaming.ingestion.kudu.SparkStreamingAppEventToKudu
--master yarn --deploy-mode client --executor-memory 512MB --num-executors 2 --executor-cores 1
AppTrans.jar
ted-training-1-4.vpc.cloudera.com:9092,ted-training-1-5.vpc.cloudera.com:9092
app-event-input
1
c
ted-training-1-2.vpc.cloudera.com
account_mart_kudu
app_event_kudu
tmp/checkpoint

##Test Kudu input select * from customer_tran_kudu;

##Rest Server com.cloudera.sa.example.card.server.kudu.KuduRestServer 4242
ted-training-1-2.vpc.cloudera.com app_event_kudu account_mart_kudu

##Run Spark SQL Example spark-submit --class com.cloudera.sa.apptrans.sql.kudu.KuduSimpleSums
--master yarn --deploy-mode client --executor-memory 512MB --num-executors 2 --executor-cores 1
AppTrans.jar
c
ted-training-1-2.vpc.cloudera.com
account_mart_kudu

#Spark Streaming to HBase ##Run Spark to HBase export JAVA_HOME=/opt/jdk1.8.0_91/

spark-submit --class com.cloudera.sa.apptrans.streaming.ingestion.hbase.SparkStreamingAppEventToHBase
--master yarn --deploy-mode client --executor-memory 512MB --num-executors 2 --executor-cores 1
AppTrans.jar
ted-training-1-4.vpc.cloudera.com:9092,ted-training-1-5.vpc.cloudera.com:9092
app-event-input
1
c
app-event
6
tmp/checkpoint
/opt/cloudera/parcels/CDH/lib/hbase/conf/

##Test HBase input scan 'card-trans'

##Rest Server com.cloudera.sa.example.card.server.hbase.HBaseRestService
4242 / /opt/cloudera/parcels/CDH/lib/hbase/conf/
6
customer_trans_kudu

apptrans's People

Watchers

Myles Daniel Baker avatar  avatar

Recommend Projects

  • React photo React

    A declarative, efficient, and flexible JavaScript library for building user interfaces.

  • Vue.js photo Vue.js

    🖖 Vue.js is a progressive, incrementally-adoptable JavaScript framework for building UI on the web.

  • Typescript photo Typescript

    TypeScript is a superset of JavaScript that compiles to clean JavaScript output.

  • TensorFlow photo TensorFlow

    An Open Source Machine Learning Framework for Everyone

  • Django photo Django

    The Web framework for perfectionists with deadlines.

  • D3 photo D3

    Bring data to life with SVG, Canvas and HTML. 📊📈🎉

Recommend Topics

  • javascript

    JavaScript (JS) is a lightweight interpreted programming language with first-class functions.

  • web

    Something interesting about the web. A new door to the world.

  • server

    A server is a program made to process requests and deliver data to clients.

  • Machine learning

    Machine learning is a way of modeling and interpreting data that allows a piece of software to respond intelligently.

  • Game

    Something interesting about games, to make everyone happy.

Recommend Org

  • Facebook photo Facebook

    We are working to build community through open source technology. NB: members must have two-factor auth.

  • Microsoft photo Microsoft

    Open source projects and samples from Microsoft.

  • Google photo Google

    Google โค๏ธ Open Source for everyone.

  • D3 photo D3

    Data-Driven Documents codes.