Skip site navigation (1)Skip section navigation (2)
Date:      Sun, 15 Feb 2015 14:21:28 +0000 (UTC)
From:      Dmitry Sivachenko <demon@FreeBSD.org>
To:        ports-committers@freebsd.org, svn-ports-all@freebsd.org, svn-ports-head@freebsd.org
Subject:   svn commit: r379038 - in head/devel: . pig pig/files
Message-ID:  <201502151421.t1FELSNb065043@svn.freebsd.org>

next in thread | raw e-mail | index | archive | help
Author: demon
Date: Sun Feb 15 14:21:28 2015
New Revision: 379038
URL: https://svnweb.freebsd.org/changeset/ports/379038
QAT: https://qat.redports.org/buildarchive/r379038/

Log:
  New port: Apache Pig.
  Pig is an engine for executing data flows in parallel on Hadoop.

Added:
  head/devel/pig/
  head/devel/pig/Makefile   (contents, props changed)
  head/devel/pig/distinfo   (contents, props changed)
  head/devel/pig/files/
  head/devel/pig/files/patch-bin-pig   (contents, props changed)
  head/devel/pig/files/patch-ivy-ivysettings.xml   (contents, props changed)
  head/devel/pig/pkg-descr   (contents, props changed)
  head/devel/pig/pkg-plist   (contents, props changed)
Modified:
  head/devel/Makefile

Modified: head/devel/Makefile
==============================================================================
--- head/devel/Makefile	Sun Feb 15 14:12:19 2015	(r379037)
+++ head/devel/Makefile	Sun Feb 15 14:21:28 2015	(r379038)
@@ -3545,6 +3545,7 @@
     SUBDIR += physfs-devel
     SUBDIR += picp
     SUBDIR += picprog
+    SUBDIR += pig
     SUBDIR += piklab
     SUBDIR += pinba_engine
     SUBDIR += pipestatus

Added: head/devel/pig/Makefile
==============================================================================
--- /dev/null	00:00:00 1970	(empty, because file is newly added)
+++ head/devel/pig/Makefile	Sun Feb 15 14:21:28 2015	(r379038)
@@ -0,0 +1,47 @@
+# Created by: Dmitry Sivachenko <demon@FreeBSD.org>
+# $FreeBSD$
+
+PORTNAME=	pig
+PORTVERSION=	0.14.0
+CATEGORIES=	devel java
+MASTER_SITES=	${MASTER_SITE_APACHE} \
+		LOCAL/demon/:ant \
+		http://people.freebsd.org/~demon/:ant \
+		http://central.maven.org/maven2/org/apache/ivy/ivy/2.2.0/:ivy
+MASTER_SITE_SUBDIR=${PORTNAME}/${PORTNAME}-${PORTVERSION}
+DISTFILES=	${PORTNAME}-${PORTVERSION}-src${EXTRACT_SUFX} FreeBSD-${PORTNAME}-${PORTVERSION}-ant-repository.tar.gz:ant ivy-2.2.0.jar:ivy
+DIST_SUBDIR=	hadoop
+EXTRACT_ONLY=	${PORTNAME}-${PORTVERSION}-src${EXTRACT_SUFX} FreeBSD-${PORTNAME}-${PORTVERSION}-ant-repository.tar.gz
+
+MAINTAINER=	demon@FreeBSD.org
+COMMENT=	Engine for executing data flows in parallel on Hadoop
+
+LICENSE=	APACHE20
+
+BUILD_DEPENDS=	${LOCALBASE}/bin/ant:${PORTSDIR}/devel/apache-ant
+RUN_DEPENDS=	bash:${PORTSDIR}/shells/bash \
+		yarn:${PORTSDIR}/devel/hadoop2
+
+USE_JAVA=	yes
+JAVA_VERSION=	1.7+
+WRKSRC=		${WRKDIR}/${PORTNAME}-${PORTVERSION}-src
+
+post-patch:
+	${REINPLACE_CMD} -e "s#%%WRKDIR%%#${WRKDIR}#" ${WRKSRC}/ivy/ivysettings.xml
+
+pre-build:
+	${CP} ${DISTDIR}/${DIST_SUBDIR}/ivy-2.2.0.jar ${WRKSRC}/ivy/
+
+do-build:
+	cd ${WRKSRC} && ${SETENV} ${MAKE_ENV} ${LOCALBASE}/bin/ant -Dhadoopversion=23
+
+post-build:
+	${REINPLACE_CMD} -e "s#%%JAVA_HOME%%#${JAVA_HOME}#" -e "s#%%LOCALBASE%%#${LOCALBASE}#" ${WRKSRC}/bin/pig
+
+do-install:
+	${MKDIR} ${STAGEDIR}${DATADIR}
+	cd ${WRKSRC} && ${COPYTREE_SHARE} lib ${STAGEDIR}${DATADIR}/
+	${INSTALL_DATA} ${WRKSRC}/pig-${PORTVERSION}-SNAPSHOT-core-h2.jar ${STAGEDIR}${DATADIR}/
+	${INSTALL_SCRIPT} ${WRKSRC}/bin/pig ${STAGEDIR}/${PREFIX}/bin/
+
+.include <bsd.port.mk>

Added: head/devel/pig/distinfo
==============================================================================
--- /dev/null	00:00:00 1970	(empty, because file is newly added)
+++ head/devel/pig/distinfo	Sun Feb 15 14:21:28 2015	(r379038)
@@ -0,0 +1,6 @@
+SHA256 (hadoop/pig-0.14.0-src.tar.gz) = e95e8449b68186966996be786c4a620b36b4e15707d263bd76c3e10cdb26c1a2
+SIZE (hadoop/pig-0.14.0-src.tar.gz) = 14651571
+SHA256 (hadoop/FreeBSD-pig-0.14.0-ant-repository.tar.gz) = cc298457ba337564a0addd4a129c8a51d7aaa1a512e6ebdf89d6cba6fb22de81
+SIZE (hadoop/FreeBSD-pig-0.14.0-ant-repository.tar.gz) = 111651511
+SHA256 (hadoop/ivy-2.2.0.jar) = 9d0a56026680999986ca33d53d12d6f28f7bff5e3c9e6e0c6633a3677ca00f18
+SIZE (hadoop/ivy-2.2.0.jar) = 947592

Added: head/devel/pig/files/patch-bin-pig
==============================================================================
--- /dev/null	00:00:00 1970	(empty, because file is newly added)
+++ head/devel/pig/files/patch-bin-pig	Sun Feb 15 14:21:28 2015	(r379038)
@@ -0,0 +1,68 @@
+--- bin/pig.orig	2014-11-17 04:37:53.000000000 +0300
++++ bin/pig	2015-02-15 16:23:44.000000000 +0300
+@@ -88,6 +88,8 @@
+     export PIG_HOME=`dirname "$this"`/..
+ fi
+ 
++PIG_CONF_DIR=${PIG_HOME}/etc/pig
++
+ if [ -z "$PIG_CONF_DIR" ]; then
+     if [ -f ${PIG_HOME}/conf/pig.properties ]; then
+         PIG_CONF_DIR=${PIG_HOME}/conf
+@@ -111,6 +113,7 @@
+     JAVA_HOME=$JAVA_HOME
+ fi
+     
++JAVA_HOME=%%JAVA_HOME%%
+ if [ "$JAVA_HOME" = "" ]; then
+     echo "Error: JAVA_HOME is not set."
+     exit 1
+@@ -206,6 +209,7 @@
+ fi
+ 
+ # add HADOOP_CONF_DIR
++HADOOP_CONF_DIR=%%LOCALBASE%%/etc/hadoop
+ if [ "$HADOOP_CONF_DIR" != "" ]; then
+     CLASSPATH=${CLASSPATH}:${HADOOP_CONF_DIR}
+ fi
+@@ -244,23 +248,23 @@
+ 
+ # For Hadoop 0.23.0+
+ #
+-#if [ -d "${PIG_HOME}/share/hadoop/common" ]; then
+-#    for f in ${PIG_HOME}/share/hadoop/common/hadoop*.jar; do
+-#        CLASSPATH=${CLASSPATH}:$f;
+-#    done
+-#fi
+-#
+-#if [ -d "${PIG_HOME}/share/hadoop/hdfs" ]; then
+-#    for f in ${PIG_HOME}/share/hadoop/hdfs/hadoop*.jar; do
+-#        CLASSPATH=${CLASSPATH}:$f;
+-#    done
+-#fi
+-#
+-#if [ -d "${PIG_HOME}/share/hadoop/mapreduce" ]; then
+-#    for f in ${PIG_HOME}/share/hadoop/mapreduce/hadoop*.jar; do
+-#        CLASSPATH=${CLASSPATH}:$f;
+-#    done
+-#fi
++if [ -d "${PIG_HOME}/share/hadoop/common" ]; then
++    for f in ${PIG_HOME}/share/hadoop/common/hadoop*.jar; do
++        CLASSPATH=${CLASSPATH}:$f;
++    done
++fi
++
++if [ -d "${PIG_HOME}/share/hadoop/hdfs" ]; then
++    for f in ${PIG_HOME}/share/hadoop/hdfs/hadoop*.jar; do
++        CLASSPATH=${CLASSPATH}:$f;
++    done
++fi
++
++if [ -d "${PIG_HOME}/share/hadoop/mapreduce" ]; then
++    for f in ${PIG_HOME}/share/hadoop/mapreduce/hadoop*.jar; do
++        CLASSPATH=${CLASSPATH}:$f;
++    done
++fi
+ 
+ if which hadoop >/dev/null; then
+     HADOOP_BIN=`which hadoop`

Added: head/devel/pig/files/patch-ivy-ivysettings.xml
==============================================================================
--- /dev/null	00:00:00 1970	(empty, because file is newly added)
+++ head/devel/pig/files/patch-ivy-ivysettings.xml	Sun Feb 15 14:21:28 2015	(r379038)
@@ -0,0 +1,10 @@
+--- ivy/ivysettings.xml.bak	2014-11-17 04:37:53.000000000 +0300
++++ ivy/ivysettings.xml	2015-02-12 18:18:00.000000000 +0300
+@@ -1,5 +1,7 @@
+ <ivysettings>
+ 
++  <caches defaultCacheDir="%%WRKDIR%%/ivy"/>
++
+  <!--
+    Licensed to the Apache Software Foundation (ASF) under one or more
+    contributor license agreements.  See the NOTICE file distributed with

Added: head/devel/pig/pkg-descr
==============================================================================
--- /dev/null	00:00:00 1970	(empty, because file is newly added)
+++ head/devel/pig/pkg-descr	Sun Feb 15 14:21:28 2015	(r379038)
@@ -0,0 +1,23 @@
+Apache Pig is a platform for analyzing large data sets that consists of a
+high-level language for expressing data analysis programs, coupled with
+infrastructure for evaluating these programs.  The salient property of Pig
+programs is that their structure is amenable to substantial parallelization,
+which in turns enables them to handle very large data sets.
+
+At the present time, Pig's infrastructure layer consists of a compiler that
+produces sequences of Map-Reduce programs, for which large-scale parallel
+implementations already exist (e.g., the Hadoop subproject).  Pig's language
+layer currently consists of a textual language called Pig Latin, which has
+the following key properties:
+
+-- Ease of programming.  It is trivial to achieve parallel execution of simple,
+"embarrassingly parallel" data analysis tasks.  Complex tasks comprised of
+multiple interrelated data transformations are explicitly encoded as data flow
+sequences, making them easy to write, understand, and maintain.
+-- Optimization opportunities.  The way in which tasks are encoded permits the
+system to optimize their execution automatically, allowing the user to focus
+on semantics rather than efficiency.
+-- Extensibility.  Users can create their own functions to do special-purpose
+processing.
+
+WWW: http://pig.apache.org/

Added: head/devel/pig/pkg-plist
==============================================================================
--- /dev/null	00:00:00 1970	(empty, because file is newly added)
+++ head/devel/pig/pkg-plist	Sun Feb 15 14:21:28 2015	(r379038)
@@ -0,0 +1,50 @@
+bin/pig
+%%DATADIR%%/lib/ST4-4.0.4.jar
+%%DATADIR%%/lib/accumulo-core-1.5.0.jar
+%%DATADIR%%/lib/accumulo-fate-1.5.0.jar
+%%DATADIR%%/lib/accumulo-server-1.5.0.jar
+%%DATADIR%%/lib/accumulo-start-1.5.0.jar
+%%DATADIR%%/lib/accumulo-trace-1.5.0.jar
+%%DATADIR%%/lib/antlr-runtime-3.4.jar
+%%DATADIR%%/lib/asm-3.3.1.jar
+%%DATADIR%%/lib/automaton-1.11-8.jar
+%%DATADIR%%/lib/avro-1.7.5.jar
+%%DATADIR%%/lib/avro-tools-1.7.5-nodeps.jar
+%%DATADIR%%/lib/groovy-all-1.8.6.jar
+%%DATADIR%%/lib/guava-11.0.jar
+%%DATADIR%%/lib/h2/avro-mapred-1.7.5-hadoop2.jar
+%%DATADIR%%/lib/h2/commons-collections4-4.0.jar
+%%DATADIR%%/lib/h2/hbase-client-0.96.0-hadoop2.jar
+%%DATADIR%%/lib/h2/hbase-common-0.96.0-hadoop2.jar
+%%DATADIR%%/lib/h2/hbase-hadoop-compat-0.96.0-hadoop2.jar
+%%DATADIR%%/lib/h2/hbase-hadoop2-compat-0.96.0-hadoop2.jar
+%%DATADIR%%/lib/h2/hbase-protocol-0.96.0-hadoop2.jar
+%%DATADIR%%/lib/h2/hbase-server-0.96.0-hadoop2.jar
+%%DATADIR%%/lib/h2/hive-shims-0.23-0.14.0.jar
+%%DATADIR%%/lib/h2/tez-api-0.5.2.jar
+%%DATADIR%%/lib/h2/tez-common-0.5.2.jar
+%%DATADIR%%/lib/h2/tez-dag-0.5.2.jar
+%%DATADIR%%/lib/h2/tez-mapreduce-0.5.2.jar
+%%DATADIR%%/lib/h2/tez-runtime-internals-0.5.2.jar
+%%DATADIR%%/lib/h2/tez-runtime-library-0.5.2.jar
+%%DATADIR%%/lib/hive-common-0.14.0.jar
+%%DATADIR%%/lib/hive-exec-0.14.0-core.jar
+%%DATADIR%%/lib/hive-serde-0.14.0.jar
+%%DATADIR%%/lib/hive-shims-common-0.14.0.jar
+%%DATADIR%%/lib/hive-shims-common-secure-0.14.0.jar
+%%DATADIR%%/lib/jackson-core-asl-1.8.8.jar
+%%DATADIR%%/lib/jackson-mapper-asl-1.8.8.jar
+%%DATADIR%%/lib/jansi-1.9.jar
+%%DATADIR%%/lib/jline-1.0.jar
+%%DATADIR%%/lib/joda-time-2.1.jar
+%%DATADIR%%/lib/jruby-complete-1.6.7.jar
+%%DATADIR%%/lib/js-1.7R2.jar
+%%DATADIR%%/lib/json-simple-1.1.jar
+%%DATADIR%%/lib/jython-standalone-2.5.3.jar
+%%DATADIR%%/lib/kryo-2.22.jar
+%%DATADIR%%/lib/protobuf-java-2.5.0.jar
+%%DATADIR%%/lib/snappy-java-1.0.5.jar
+%%DATADIR%%/lib/trevni-avro-1.7.5.jar
+%%DATADIR%%/lib/trevni-core-1.7.5.jar
+%%DATADIR%%/lib/zookeeper-3.4.5.jar
+%%DATADIR%%/pig-0.14.0-SNAPSHOT-core-h2.jar



Want to link to this message? Use this URL: <https://mail-archive.FreeBSD.org/cgi/mid.cgi?201502151421.t1FELSNb065043>