From 1b39d03ba87e737f54c632dca20bdc7adbd02fe5 Mon Sep 17 00:00:00 2001 From: matfax Date: Tue, 27 Sep 2016 11:06:05 +0200 Subject: [PATCH] Bump to Spark 2.0 with Scala 2.11 --- pom.xml | 18 +++++++++--------- .../spark/mllib/clustering/dbscan/DBSCAN.scala | 3 +-- .../dbscan/EvenSplitPartitioner.scala | 4 ++-- .../clustering/dbscan/LocalDBSCANArchery.scala | 10 +++------- .../clustering/dbscan/LocalDBSCANNaive.scala | 6 +++--- .../mllib/clustering/dbscan/DBSCANSuite.scala | 1 - 6 files changed, 18 insertions(+), 24 deletions(-) diff --git a/pom.xml b/pom.xml index e5e660c..748e7f9 100644 --- a/pom.xml +++ b/pom.xml @@ -5,8 +5,8 @@ 4.0.0 com.irvingc.spark - dbscan-on-spark_2.10 - 0.2.0-SNAPSHOT + dbscan-on-spark_2.11 + 0.3.0-SNAPSHOT Distributed DBSCAN on Apache Spark http://www.irvingc.com/dbscan-on-spark @@ -30,10 +30,10 @@ UTF-8 UTF-8 - 2.10.4 - 2.10 - 2.2.1 - 1.6.1 + 2.11.8 + 2.11 + 2.2.6 + 2.0.0 @@ -71,7 +71,7 @@ com.meetup archery_${scala.binary.version} - 0.3.0 + 0.4.0 org.scalatest @@ -86,7 +86,7 @@ net.alchim31.maven scala-maven-plugin - 3.2.0 + 3.2.2 @@ -99,7 +99,7 @@ org.scalastyle scalastyle-maven-plugin - 0.6.0 + 0.8.0 false true diff --git a/src/main/scala/org/apache/spark/mllib/clustering/dbscan/DBSCAN.scala b/src/main/scala/org/apache/spark/mllib/clustering/dbscan/DBSCAN.scala index 3d9c470..70acb5c 100644 --- a/src/main/scala/org/apache/spark/mllib/clustering/dbscan/DBSCAN.scala +++ b/src/main/scala/org/apache/spark/mllib/clustering/dbscan/DBSCAN.scala @@ -16,8 +16,7 @@ */ package org.apache.spark.mllib.clustering.dbscan -import org.apache.spark.Logging -import org.apache.spark.SparkContext.rddToPairRDDFunctions +import org.apache.spark.internal.Logging import org.apache.spark.mllib.clustering.dbscan.DBSCANLabeledPoint.Flag import org.apache.spark.mllib.linalg.Vector import org.apache.spark.rdd.RDD diff --git a/src/main/scala/org/apache/spark/mllib/clustering/dbscan/EvenSplitPartitioner.scala b/src/main/scala/org/apache/spark/mllib/clustering/dbscan/EvenSplitPartitioner.scala index b2d5e7f..b9cda4e 100644 --- a/src/main/scala/org/apache/spark/mllib/clustering/dbscan/EvenSplitPartitioner.scala +++ b/src/main/scala/org/apache/spark/mllib/clustering/dbscan/EvenSplitPartitioner.scala @@ -16,9 +16,9 @@ */ package org.apache.spark.mllib.clustering.dbscan -import scala.annotation.tailrec +import org.apache.spark.internal.Logging -import org.apache.spark.Logging +import scala.annotation.tailrec /** * Helper methods for calling the partitioner diff --git a/src/main/scala/org/apache/spark/mllib/clustering/dbscan/LocalDBSCANArchery.scala b/src/main/scala/org/apache/spark/mllib/clustering/dbscan/LocalDBSCANArchery.scala index d479b80..ae9a4a9 100644 --- a/src/main/scala/org/apache/spark/mllib/clustering/dbscan/LocalDBSCANArchery.scala +++ b/src/main/scala/org/apache/spark/mllib/clustering/dbscan/LocalDBSCANArchery.scala @@ -16,15 +16,11 @@ */ package org.apache.spark.mllib.clustering.dbscan -import scala.collection.mutable.Queue - -import org.apache.spark.Logging +import archery.{Box, Entry, Point, RTree} +import org.apache.spark.internal.Logging import org.apache.spark.mllib.clustering.dbscan.DBSCANLabeledPoint.Flag -import archery.Box -import archery.Entry -import archery.Point -import archery.RTree +import scala.collection.mutable.Queue /** * An implementation of DBSCAN using an R-Tree to improve its running time diff --git a/src/main/scala/org/apache/spark/mllib/clustering/dbscan/LocalDBSCANNaive.scala b/src/main/scala/org/apache/spark/mllib/clustering/dbscan/LocalDBSCANNaive.scala index 1f067da..2115fb8 100644 --- a/src/main/scala/org/apache/spark/mllib/clustering/dbscan/LocalDBSCANNaive.scala +++ b/src/main/scala/org/apache/spark/mllib/clustering/dbscan/LocalDBSCANNaive.scala @@ -16,12 +16,12 @@ */ package org.apache.spark.mllib.clustering.dbscan -import scala.collection.mutable.Queue - -import org.apache.spark.Logging +import org.apache.spark.internal.Logging import org.apache.spark.mllib.clustering.dbscan.DBSCANLabeledPoint.Flag import org.apache.spark.mllib.linalg.Vectors +import scala.collection.mutable.Queue + /** * A naive implementation of DBSCAN. It has O(n2) complexity * but uses no extra memory. This implementation is not used diff --git a/src/test/scala/org/apache/spark/mllib/clustering/dbscan/DBSCANSuite.scala b/src/test/scala/org/apache/spark/mllib/clustering/dbscan/DBSCANSuite.scala index 271883b..16a8b8e 100644 --- a/src/test/scala/org/apache/spark/mllib/clustering/dbscan/DBSCANSuite.scala +++ b/src/test/scala/org/apache/spark/mllib/clustering/dbscan/DBSCANSuite.scala @@ -16,7 +16,6 @@ */ package org.apache.spark.mllib.clustering.dbscan -import org.apache.spark.SparkContext.rddToPairRDDFunctions import org.apache.spark.mllib.linalg.Vectors import org.apache.spark.mllib.util.MLlibTestSparkContext import org.scalatest.Matchers