日韩久久久精品,亚洲精品久久久久久久久久久,亚洲欧美一区二区三区国产精品 ,一区二区福利

配置RHadoop與運行WordCount例子

系統 2784 0

1、安裝R語言環境

su -c 'rpm -Uvh http://download.fedoraproject.org/pub/epel/6/i386/epel-release-6-8.noarch.rpm'

su -c 'yum install foo'

yum list R-\*

yum install R

2、安裝RStudio Desktop和Server

Desktop是rpm包,雙擊執行

Server安裝命令:

yum install openssl098e # Required only for RedHat/CentOS 6 and 7

wget http://download2.rstudio.org/rstudio-server-0.98.1091-x86_64.rpm

yum install --nogpgcheck rstudio-server-0.98.1091-x86_64.rpm

添加r-user用戶

3、安裝gcc、git、pkg-config

yum install gcc git pkg-config

4、安裝thrift0.9.0

yum install automake libtool flex bison pkgconfig gcc-c++ boost-devel libevent-devel zlib-devel python-devel ruby-devel

編譯安裝步驟:

Update the System

????yum -y update

Install the Platform Development Tools

????yum -y groupinstall "Development Tools"

Upgrade autoconf/automake/bison

????yum install -y wget

Upgrade autoconf

????wget http://ftp.gnu.org/gnu/autoconf/autoconf-2.69.tar.gz

????tar xvf autoconf-2.69.tar.gz

????cd autoconf-2.69

????./configure --prefix=/usr

????make

????make install

Upgrade automake

????wget http://ftp.gnu.org/gnu/automake/automake-1.14.tar.gz

????tar xvf automake-1.14.tar.gz

????cd automake-1.14

????./configure --prefix=/usr

????make

????make install

Upgrade bison

????wget http://ftp.gnu.org/gnu/bison/bison-2.5.1.tar.gz

????tar xvf bison-2.5.1.tar.gz

????cd bison-2.5.1

????./configure --prefix=/usr

????make

????make install

Install C++ Lib Dependencies

????yum -y install libevent-devel zlib-devel openssl-devel

Upgrade Boost

????wget http://sourceforge.net/projects/boost/files/boost/1.55.0/boost_1_55_0.tar.gz

????tar xvf boost_1_55_0.tar.gz

????cd boost_1_55_0

????./bootstrap.sh

????./b2 install

Build and Install the Apache Thrift IDL Compiler

    git clone https://git-wip-us.apache.org/repos/asf/thrift.git

    cd thrift

    ./bootstrap.sh

    ./configure --with-lua=no

    修改 /thrift-0.9.1/lib/cpp/thrift.pc,將 includedir 設為 ${prefix}/include/thrift

    make

    make install

Update PKG_CONFIG_PATH:

    export PKG_CONFIG_PATH=$PKG_CONFIG_PATH:/usr/local/lib/pkgconfig/

Verify that the pkg-config path is correct:

    pkg-config --cflags thrift

    returns:

    -I /usr/local/include/thrift

拷貝文件到lib文件夾

????cp /usr/local/lib/libthrift-1.0.0-dev.so /usr/lib/

5、設置Linux環境變量

export HADOOP_PREFIX=/usr/lib/hadoop

export HADOOP_CMD=/usr/lib/hadoop/bin/hadoop

export HADOOP_STREAMING=/usr/lib/hadoop-mapreduce/hadoop-streaming.jar

6、root用戶下開啟R環境安裝依賴包

install.packages(c("rJava", "Rcpp", "RJSONIO", "bitops", "digest",

????????????????????"functional", "stringr", "plyr", "reshape2", "dplyr",

????????????????????"R.methodsS3", "caTools", "Hmisc", "data.table", "memoise"))

7、root用戶下開啟R環境安裝RHadoop包

install.packages("/root/RHadoop/rhdfs_1.0.8.tar.gz", repos=NULL, type="source")

install.packages("/root/RHadoop/rmr2_3.3.0.tar.gz", repos=NULL, type="source")

install.packages("/root/RHadoop/plyrmr_0.5.0.tar.gz", repos=NULL, type="source")

install.packages("/root/RHadoop/rhbase_1.2.1.tar.gz", repos=NULL, type="source")

8、配置ant 和 maven

export MAVEN_HOME=/root/apache-maven-3.2.5

export PATH=/root/apache-maven-3.2.5/bin:$PATH

export ANT_HOME=/root/apache-ant-1.9.4

export PATH=$ANT_HOME/bin:$PATH

9、測試RHadoop

Sys.setenv("HADOOP_PREFIX"="/usr/lib/hadoop")

Sys.setenv("HADOOP_CMD"="/usr/lib/hadoop/bin/hadoop")

Sys.setenv("HADOOP_STREAMING"="/usr/lib/hadoop-mapreduce/hadoop-streaming.jar")

?

????library(rmr2)

????bp = rmr.options("backend.parameters")

????trans <- list(D="mapreduce.map.java.opts=-Xmx400M",

???????????????? D="mapreduce.reduce.java.opts=-Xmx400M",

???????????????? D="mapreduce.map.memory.mb=4096",

???????????????? D="mapreduce.reduce.memory.mb=4096",

???????????????? D="mapreduce.task.io.sort.mb=100")

????bp <- list(hadoop=trans)

????#### 沒有使用的代碼 開始 #######################

????bp$hadoop[1]="mapreduce.map.java.opts=-Xmx400M"

????bp$hadoop[2]="mapreduce.reduce.java.opts=-Xmx400M"

????bp$hadoop[3]="mapreduce.map.memory.mb=1024"

????bp$hadoop[4]="mapreduce.reduce.memory.mb=2048"

????bp$hadoop[5]="mapreduce.task.io.sort.mb=100"

    #### 沒有使用的代碼 結束 #######################

????rmr.options(backend.parameters = bp)

????rmr.options("backend.parameters")

????## map function

# Mapper for the word count job.
#
# k:     input key passed in by the framework; not used here.
# lines: character vector of input text lines.
#
# Returns keyval(words, 1), i.e. one (word, 1) pair per token, or NULL when
# the chunk contains no tokens at all.
map <- function(k, lines) {
  # Split on runs of whitespace so consecutive blanks or tabs do not
  # produce empty-string tokens between them.
  words <- unlist(strsplit(lines, "\\s+"))

  # A line that starts with whitespace still yields one leading "" token;
  # drop those so the empty string is never counted as a word.
  words <- words[nzchar(words)]

  # Nothing to emit for an all-blank chunk.
  if (length(words) == 0) {
    return(NULL)
  }

  keyval(words, 1)
}

????## reduce function

# Reducer for the word count job.
#
# word:   the key being reduced.
# counts: the values collected for that key.
#
# Returns keyval(word, sum(counts)).
reduce <- function(word, counts) {
  total <- sum(counts)
  keyval(word, total)
}

# Run the word count job.
#
# input:  passed through as the `input` argument of mapreduce().
# output: passed through as the `output` argument of mapreduce();
#         defaults to NULL.
#
# Returns whatever mapreduce() returns. Uses the `map` and `reduce`
# functions defined in this script and reads the input as "text".
wordcount <- function(input, output = NULL) {
  mapreduce(
    input = input,
    output = output,
    input.format = "text",
    map = map,
    reduce = reduce
  )
}

?

????## delete previous result if any

????system("/usr/lib/hadoop/bin/hadoop fs -rm -r /tmp/zhengcong/out")

????

????## Submit job

????hdfs.root <- '/tmp/zhengcong'

????hdfs.data <- file.path(hdfs.root, 'hp')

????hdfs.out <- file.path(hdfs.root, 'out')

????out <- wordcount(hdfs.data, hdfs.out)

?

????## Fetch results from HDFS

????results <- from.dfs(out)

?

????## check top 30 frequent words

# Convert the fetched result into a data frame with one row per word.
# TRUE/FALSE are spelled out because T and F are ordinary variables that
# can be reassigned.
results.df <- as.data.frame(results, stringsAsFactors = FALSE)
colnames(results.df) <- c("word", "count")

# Show the 30 rows with the highest counts, largest first.
by_count_desc <- order(results.df$count, decreasing = TRUE)
head(results.df[by_count_desc, ], 30)

?

10、錯誤解決

    rJava無法加載時,在root用戶下運行 R CMD javareconf -e

    並添加環境變量:export LD_LIBRARY_PATH=$JAVA_HOME/lib/amd64:$JAVA_HOME/jre/lib/amd64/server

配置RHadoop與運行WordCount例子


更多文章、技術交流、商務合作、聯繫博主

微信掃碼或搜索:z360901061

微信掃一掃加我為好友

QQ號聯(lián)系: 360901061

您的支持是博主寫作最大的動力,如果您喜歡我的文章,感覺我的文章對您有幫助,請用微信掃描下面二維碼支持博主2元、5元、10元、20元等您想捐的金額吧,狠狠點擊下面給點支持吧,站長非常感激您!手機微信長按不能支付解決辦法:請將微信支付二維碼保存到相冊,切換到微信,然后點擊微信右上角掃一掃功能,選擇支付二維碼完成支付。

【本文對您有幫助就好】

您的支持是博主寫作最大的動力,如果您喜歡我的文章,感覺我的文章對您有幫助,請用微信掃描上面二維碼支持博主2元、5元、10元、自定義金額等您想捐的金額吧,站長會非常 感謝您的哦!!!

發表我的評論
最新評論 總共0條評論
主站蜘蛛池模板: 桐柏县| 招远市| 沽源县| 阳原县| 垦利县| 大足县| 乡城县| 谷城县| 九台市| 栾城县| 靖西县| 金沙县| 策勒县| 涟源市| 阳高县| 山丹县| 黎川县| 探索| 灵宝市| 新沂市| 资兴市| 浮山县| 永城市| 泰和县| 旺苍县| 伊宁市| 集贤县| 南康市| 磐石市| 福鼎市| 永新县| 兴宁市| 宁远县| 津市市| 洞口县| 翁源县| 肥西县| 聊城市| 巩义市| 七台河市| 哈巴河县|