Skip to content

airpingu/rhadoopiii

 
 

Folders and files

NameName
Last commit message
Last commit date

Latest commit

 

History

14 Commits
 
 
 
 
 
 
 
 
 
 
 
 
 
 

Repository files navigation

RHadoop Course Material

Slideshare: https://www.slideshare.net/secret/gDf3JYJRPWzkf5

Source Code: http://rpubs.com/ywchiu/25570

$ sudo yum install libxml2-devel

$ sudo yum install curl-devel

$ sudo R

# Install prerequisite R packages. Package names are case-sensitive:
# the CRAN package is "RCurl", not "Rcurl".
install.packages(c("RCurl", "httr"), dependencies = TRUE)

install.packages("devtools", dependencies = TRUE)

library(devtools)

# install_github() takes the repository as a single "owner/repo" string.
install_github("hadley/pryr")

install.packages(c("R.methodsS3", "hydroPSO"), dependencies = TRUE)

install.packages("dplyr", dependencies = TRUE)

install.packages("rjson", dependencies = TRUE)

$ wget --no-check-certificate https://raw.github.com/RevolutionAnalytics/plyrmr/master/build/plyrmr_0.5.0.tar.gz

$ sudo R CMD INSTALL plyrmr_0.5.0.tar.gz

2330 Analysis

==========================

# Load the tw2330 data set; the first row of the CSV holds the column names.
tw2330 <- read.csv("~/Downloads/tw2330.csv", header = TRUE)

# Inspect the first rows, the last rows, and the column types.
head(tw2330)

head(tw2330, 10)

tail(tw2330, 10)

str(tw2330)

# Convert the Date column to class Date so it can be compared with dates.
tw2330$Date <- as.Date(tw2330$Date)

str(tw2330)

# Keep rows dated from 2014-03-01 (inclusive) to 2014-09-01 (exclusive),
# store them, and print the result.
tw2330_mar_sep <- tw2330[
  tw2330$Date >= as.Date("2014-03-01") & tw2330$Date < as.Date("2014-09-01"),
]

tw2330_mar_sep

# Summary statistics of Close within the selected date window.
min(tw2330_mar_sep$Close)

max(tw2330_mar_sep$Close)

mean(tw2330_mar_sep$Close)

# Distribution of Close: selected window first, then the full data set.
hist(tw2330_mar_sep$Close)

hist(tw2330$Close)

boxplot(tw2330$Close)

# Rows with the highest Close values.
head(tw2330[order(tw2330$Close, decreasing = TRUE), ])

# Flag rows where Close is greater than Open; the comparison already yields
# a logical vector, so no ifelse() wrapper is needed.
tw2330$tf <- tw2330$Close - tw2330$Open > 0

# Count the rows for each flag value.
table(tw2330$tf)

RHBASE INSTALL

==============================

hbase shell

create 't1','f1'

ERROR: Can't get master address from ZooKeeper; znode data == null

restart hbase service

sudo service hbase-master restart

sudo env JAVA_HOME=/usr/java/jdk1.7.0_67-cloudera /usr/lib/hbase/bin/hbase-daemon.sh restart regionserver

sudo service zookeeper-server restart

install thrift

sudo yum install automake libtool flex bison pkgconfig gcc-c++ boost-devel libevent-devel zlib-devel python-devel ruby-devel

sudo yum install openssl openssl-devel

wget https://archive.apache.org/dist/thrift/0.8.0/thrift-0.8.0.tar.gz

tar -zxvf thrift-0.8.0.tar.gz

cd thrift-0.8.0

./configure

make

sudo make install

config thrift

sudo updatedb

export PKG_CONFIG_PATH=$PKG_CONFIG_PATH:/usr/local/lib/pkgconfig

pkg-config --cflags thrift

sudo cp /usr/local/lib/libthrift-0.8.0.so /usr/lib64/

install rhbase

wget --no-check-certificate https://github.com/RevolutionAnalytics/rhbase/blob/master/build/rhbase_1.2.1.tar.gz?raw=true

mv rhbase_1.2.1.tar.gz?raw=true rhbase_1.2.1.tar.gz

sudo PKG_CONFIG_PATH=/usr/local/lib/pkgconfig R CMD INSTALL rhbase_1.2.1.tar.gz

Releases

No releases published

Packages

No packages published

Languages

  • HTML 86.6%
  • R 11.8%
  • Shell 1.3%
  • PigLatin 0.3%