-
Notifications
You must be signed in to change notification settings - Fork 708
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Move parquet cascading schemes to subprojects #1514
base: develop
Are you sure you want to change the base?
Changes from all commits
6447bdb
2f2feb9
119f87f
96607da
443929f
8079633
46bb22f
3d1e76a
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -43,6 +43,7 @@ val scroogeVersion = "3.20.0" | |
val slf4jVersion = "1.6.6" | ||
val thriftVersion = "0.5.0" | ||
val junitVersion = "4.10" | ||
// Version of the "com.novocode" % "junit-interface" test dependency; intended as the single place to bump it. | ||
val junitInterfaceVersion = "0.11" | ||
|
||
val printDependencyClasspath = taskKey[Unit]("Prints location of the dependencies") | ||
|
||
|
@@ -64,7 +65,7 @@ val sharedSettings = Project.defaultSettings ++ assemblySettings ++ scalariformS | |
"org.scalacheck" %% "scalacheck" % scalaCheckVersion % "test", | ||
"org.scalatest" %% "scalatest" % scalaTestVersion % "test", | ||
"org.slf4j" % "slf4j-log4j12" % slf4jVersion % "test", | ||
"com.novocode" % "junit-interface" % "0.10" % "test" | ||
"com.novocode" % "junit-interface" % junitInterfaceVersion % "test" | ||
), | ||
|
||
resolvers ++= Seq( | ||
|
@@ -384,27 +385,36 @@ lazy val scaldingParquetFixtures = module("parquet-fixtures") | |
) | ||
) | ||
|
||
lazy val scaldingParquet = module("parquet").settings( | ||
libraryDependencies <++= (scalaVersion) { scalaVersion => Seq( | ||
// separate target that only depends on parquet, thrift, eb and cascading. Not scalding. | ||
lazy val scaldingParquetCascading = module("parquet-cascading").settings( | ||
libraryDependencies ++= Seq( | ||
"org.apache.parquet" % "parquet-column" % parquetVersion, | ||
"org.apache.parquet" % "parquet-hadoop" % parquetVersion, | ||
"org.apache.parquet" % "parquet-thrift" % parquetVersion | ||
// see https://issues.apache.org/jira/browse/PARQUET-143 for exclusions | ||
exclude("org.apache.parquet", "parquet-pig") | ||
exclude("com.twitter.elephantbird", "elephant-bird-pig") | ||
exclude("com.twitter.elephantbird", "elephant-bird-core"), | ||
"org.apache.thrift" % "libthrift" % "0.7.0", | ||
"org.apache.thrift" % "libthrift" % thriftVersion, | ||
"org.apache.hadoop" % "hadoop-client" % hadoopVersion % "provided", | ||
"cascading" % "cascading-core" % cascadingVersion, | ||
"cascading" % "cascading-hadoop" % cascadingVersion, | ||
"com.twitter.elephantbird" % "elephant-bird-core" % elephantbirdVersion % "test" | ||
) | ||
).dependsOn(scaldingParquetFixtures % "test->test") | ||
|
||
lazy val scaldingParquet = module("parquet").settings( | ||
libraryDependencies <++= (scalaVersion) { scalaVersion => Seq( | ||
"org.apache.parquet" % "parquet-column" % parquetVersion, | ||
"org.apache.parquet" % "parquet-hadoop" % parquetVersion, | ||
"org.slf4j" % "slf4j-api" % slf4jVersion, | ||
"org.apache.hadoop" % "hadoop-client" % hadoopVersion % "provided", | ||
"org.scala-lang" % "scala-reflect" % scalaVersion, | ||
"com.twitter" %% "bijection-macros" % bijectionVersion, | ||
"com.twitter" %% "chill-bijection" % chillVersion, | ||
"com.twitter.elephantbird" % "elephant-bird-core" % elephantbirdVersion % "test" | ||
"com.twitter" %% "chill-bijection" % chillVersion | ||
) ++ (if(isScala210x(scalaVersion)) Seq("org.scalamacros" %% "quasiquotes" % quasiquotesVersion) else Seq()) | ||
}, addCompilerPlugin("org.scalamacros" % "paradise" % paradiseVersion cross CrossVersion.full)) | ||
.dependsOn(scaldingCore, scaldingHadoopTest % "test", scaldingParquetFixtures % "test->test") | ||
|
||
|
||
.dependsOn(scaldingCore, scaldingParquetCascading, scaldingHadoopTest % "test") | ||
|
||
lazy val scaldingParquetScroogeFixtures = module("parquet-scrooge-fixtures") | ||
.settings(ScroogeSBT.newSettings:_*) | ||
|
@@ -432,22 +442,37 @@ lazy val scaldingParquetScroogeFixtures = module("parquet-scrooge-fixtures") | |
) | ||
) | ||
|
||
lazy val scaldingParquetScrooge = module("parquet-scrooge") | ||
// Separate target for the scrooge-based cascading schemes. It only depends on parquet, scrooge, | ||
// eb (elephant-bird) and cascading -- NOT on scalding: note that scaldingCore is absent from dependsOn. | ||
lazy val scaldingParquetScroogeCascading = module("parquet-scrooge-cascading") | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. again, this only depends on cascading, parquet and scrooge, right? Comment? |
||
.settings( | ||
libraryDependencies ++= Seq( | ||
"org.slf4j" % "slf4j-api" % slf4jVersion, | ||
"cascading" % "cascading-core" % cascadingVersion, | ||
// see https://issues.apache.org/jira/browse/PARQUET-143 for exclusions | ||
"org.apache.parquet" % "parquet-thrift" % parquetVersion % "test" classifier "tests" | ||
exclude("org.apache.parquet", "parquet-pig") | ||
exclude("com.twitter.elephantbird", "elephant-bird-pig") | ||
exclude("com.twitter.elephantbird", "elephant-bird-core"), | ||
"com.twitter" %% "scrooge-serializer" % scroogeVersion, | ||
"org.apache.hadoop" % "hadoop-client" % hadoopVersion % "provided", | ||
// use the shared junitInterfaceVersion (not a literal) so this module stays in sync with the others | ||
"com.novocode" % "junit-interface" % junitInterfaceVersion % "test", | ||
"junit" % "junit" % junitVersion % "test" | ||
) | ||
// compile->compile pulls in the base cascading schemes; test->test reuses that module's test classes | ||
).dependsOn(scaldingParquetCascading % "compile->compile;test->test", scaldingParquetScroogeFixtures % "test->test") | ||
|
||
lazy val scaldingParquetScrooge = module("parquet-scrooge") | ||
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Shouldn't we merge this with [target name lost in extraction; presumably parquet-scrooge-cascading]? There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. I separated these so that the cascading schemes go in a different sub-project. After this change, parquet-scrooge would contain only the ParquetScrooge trait and the related time-pathed sources (which need scalding-core). If this is too thin to be its own sub-project, then I can merge the two back together. |
||
.settings( | ||
libraryDependencies ++= Seq( | ||
// see https://issues.apache.org/jira/browse/PARQUET-143 for exclusions | ||
"org.apache.parquet" % "parquet-thrift" % parquetVersion % "test" classifier "tests" | ||
exclude("org.apache.parquet", "parquet-pig") | ||
exclude("com.twitter.elephantbird", "elephant-bird-pig") | ||
exclude("com.twitter.elephantbird", "elephant-bird-core"), | ||
"com.twitter" %% "scrooge-serializer" % scroogeVersion, | ||
"org.apache.hadoop" % "hadoop-client" % hadoopVersion % "provided", | ||
"com.twitter.elephantbird" % "elephant-bird-core" % elephantbirdVersion % "test", | ||
"com.novocode" % "junit-interface" % junitInterfaceVersion % "test", | ||
"junit" % "junit" % junitVersion % "test" | ||
) | ||
).dependsOn(scaldingCore, scaldingParquet % "compile->compile;test->test", scaldingParquetScroogeFixtures % "test->test") | ||
).dependsOn(scaldingCore, scaldingParquetScroogeCascading, scaldingParquet % "compile->compile;test->test", scaldingParquetScroogeFixtures % "test->test") | ||
|
||
lazy val scaldingHRaven = module("hraven").settings( | ||
libraryDependencies ++= Seq( | ||
|
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,6 @@ | ||
package com.twitter.scalding.parquet | ||
|
||
// Exposes Parquet346ScroogeScheme under com.twitter.scalding.parquet.scrooge as a type alias for the | ||
// class that lives in com.twitter.scalding.parquet.cascading.scrooge. | ||
// NOTE(review): presumably kept so existing references to the old package keep compiling -- confirm. | ||
// Only the type is aliased; no companion/value alias is defined here. | ||
package object scrooge { | ||
type Parquet346ScroogeScheme[T <: com.twitter.scrooge.ThriftStruct] = com.twitter.scalding.parquet.cascading.scrooge.Parquet346ScroogeScheme[T] | ||
} | ||
|
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,10 @@ | ||
package com.twitter.scalding | ||
|
||
// Exposes ParquetValueScheme under com.twitter.scalding.parquet as a type alias for the class in | ||
// com.twitter.scalding.parquet.cascading. | ||
// NOTE(review): presumably kept so existing references to the old package keep compiling -- confirm. | ||
package object parquet { | ||
type ParquetValueScheme[T] = com.twitter.scalding.parquet.cascading.ParquetValueScheme[T] | ||
|
||
// Stand-in object so that the nested type `ParquetValueScheme.Config[T]` also resolves from this package. | ||
// It carries only the type alias; it does not forward any members of the aliased class. | ||
object ParquetValueScheme { | ||
type Config[T] = com.twitter.scalding.parquet.cascading.ParquetValueScheme.Config[T] | ||
} | ||
} | ||
|
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,6 @@ | ||
package com.twitter.scalding.parquet | ||
|
||
// Exposes Parquet346TBaseScheme under com.twitter.scalding.parquet.thrift as a type alias for the | ||
// class that lives in com.twitter.scalding.parquet.cascading.thrift. | ||
// NOTE(review): presumably kept so existing references to the old package keep compiling -- confirm. | ||
// Only the type is aliased; no companion/value alias is defined here. | ||
package object thrift { | ||
type Parquet346TBaseScheme[T <: org.apache.thrift.TBase[_, _]] = com.twitter.scalding.parquet.cascading.thrift.Parquet346TBaseScheme[T] | ||
} | ||
|
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,6 @@ | ||
package com.twitter.scalding.parquet | ||
|
||
// Exposes ParquetTupleScheme under com.twitter.scalding.parquet.tuple as a type alias for the | ||
// class that lives in com.twitter.scalding.parquet.cascading.tuple. | ||
// NOTE(review): presumably kept so existing references to the old package keep compiling -- confirm. | ||
// Only the type is aliased; no companion/value alias is defined here. | ||
package object tuple { | ||
type ParquetTupleScheme = com.twitter.scalding.parquet.cascading.tuple.ParquetTupleScheme | ||
} | ||
|
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
OK, so the point here is that this target depends only on cascading + parquet, not on scalding. Can we add a comment stating that purpose so that it is not overlooked?