* [BAEL-3634] Code for Spark DataFrame article * [BAEL-3634] Improve example data sample and sort aggregations * [BAEL-3634] change column name for clarity * [BAEL-3634] Update method name with U.S. English standard Co-authored-by: uzma khan <uzma.khan@nominet.uk>
		
			
				
	
	
		
			113 lines
		
	
	
		
			4.7 KiB
		
	
	
	
		
			XML
		
	
	
	
	
	
			
		
		
	
	
			113 lines
		
	
	
		
			4.7 KiB
		
	
	
	
		
			XML
		
	
	
	
	
	
| <?xml version="1.0" encoding="UTF-8"?>
 | |
| <project xmlns="http://maven.apache.org/POM/4.0.0"
 | |
|     xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
 | |
|     xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
 | |
|     <!-- Module coordinates. No <groupId> is declared here, so it is inherited from the <parent> element. -->
 | |
|     <modelVersion>4.0.0</modelVersion>
 | |
|     <artifactId>apache-spark</artifactId>
 | |
|     <version>1.0-SNAPSHOT</version>
 | |
|     <name>apache-spark</name>
 | |
|     <packaging>jar</packaging>
 | |
|     <url>http://maven.apache.org</url>
 | |
| 
 | |
|     <!-- Parent POM. No <relativePath> is given, so Maven first looks for it at the default ../pom.xml. -->
 | |
|     <parent>
 | |
|         <groupId>com.baeldung</groupId>
 | |
|         <artifactId>parent-modules</artifactId>
 | |
|         <version>1.0.0-SNAPSHOT</version>
 | |
|     </parent>
 | |
| 
 | |
|     <!-- Runtime libraries. Every version is a placeholder resolved from the <properties> section of this file. -->
 | |
|     <!-- All Spark and connector artifacts below carry the _2.11 suffix, i.e. they are Scala 2.11 builds. -->
 | |
|     <dependencies>
 | |
|         <dependency>
 | |
|             <groupId>org.apache.spark</groupId>
 | |
|             <artifactId>spark-core_2.11</artifactId>
 | |
|             <version>${org.apache.spark.spark-core.version}</version>
 | |
|         </dependency>
 | |
|         <dependency>
 | |
|             <groupId>org.apache.spark</groupId>
 | |
|             <artifactId>spark-sql_2.11</artifactId>
 | |
|             <version>${org.apache.spark.spark-sql.version}</version>
 | |
|         </dependency>
 | |
|         <dependency>
 | |
|             <groupId>org.apache.spark</groupId>
 | |
|             <artifactId>spark-graphx_2.11</artifactId>
 | |
|             <version>${org.apache.spark.spark-graphx.version}</version>
 | |
|         </dependency>
 | |
|         <!-- The only artifact here without a Scala suffix in its artifactId; the Spark/Scala line is encoded in its version string instead. -->
 | |
|         <dependency>
 | |
|             <groupId>graphframes</groupId>
 | |
|             <artifactId>graphframes</artifactId>
 | |
|             <version>${graphframes.version}</version>
 | |
|         </dependency>
 | |
|         <dependency>
 | |
|             <groupId>org.apache.spark</groupId>
 | |
|             <artifactId>spark-streaming_2.11</artifactId>
 | |
|             <version>${org.apache.spark.spark-streaming.version}</version>
 | |
|         </dependency>
 | |
|         <dependency>
 | |
|             <groupId>org.apache.spark</groupId>
 | |
|             <artifactId>spark-mllib_2.11</artifactId>
 | |
|             <version>${org.apache.spark.spark-mllib.version}</version>
 | |
|         </dependency>
 | |
|         <dependency>
 | |
|             <groupId>org.apache.spark</groupId>
 | |
|             <artifactId>spark-streaming-kafka-0-10_2.11</artifactId>
 | |
|             <version>${org.apache.spark.spark-streaming-kafka.version}</version>
 | |
|         </dependency>
 | |
|         <dependency>
 | |
|             <groupId>com.datastax.spark</groupId>
 | |
|             <artifactId>spark-cassandra-connector_2.11</artifactId>
 | |
|             <version>${com.datastax.spark.spark-cassandra-connector.version}</version>
 | |
|         </dependency>
 | |
|         <!-- NOTE(review): this artifact resolves to a 1.6.0-M1 milestone while the main connector above resolves to 2.5.2; confirm the two are meant to be used together. -->
 | |
|         <dependency>
 | |
|             <groupId>com.datastax.spark</groupId>
 | |
|             <artifactId>spark-cassandra-connector-java_2.11</artifactId>
 | |
|             <version>${com.datastax.spark.spark-cassandra-connector-java.version}</version>
 | |
|         </dependency>
 | |
|         <dependency>
 | |
|             <groupId>org.postgresql</groupId>
 | |
|             <artifactId>postgresql</artifactId>
 | |
|             <version>${postgres.version}</version>
 | |
|         </dependency>
 | |
|     </dependencies>
 | |
| 
 | |
|     <build>
 | |
|         <plugins>
 | |
|             <!-- Binds assembly:single to the package phase, using the predefined jar-with-dependencies descriptor. -->
 | |
|             <plugin>
 | |
|                 <!-- Spelled out for clarity; this is the groupId Maven assumes for plugins when none is given. -->
 | |
|                 <groupId>org.apache.maven.plugins</groupId>
 | |
|                 <artifactId>maven-assembly-plugin</artifactId>
 | |
|                 <version>3.3.0</version>
 | |
|                 <configuration>
 | |
|                     <descriptorRefs>
 | |
|                         <descriptorRef>jar-with-dependencies</descriptorRef>
 | |
|                     </descriptorRefs>
 | |
|                 </configuration>
 | |
|                 <executions>
 | |
|                     <execution>
 | |
|                         <phase>package</phase>
 | |
|                         <goals>
 | |
|                             <goal>single</goal>
 | |
|                         </goals>
 | |
|                     </execution>
 | |
|                 </executions>
 | |
|             </plugin>
 | |
|         </plugins>
 | |
|     </build>
 | |
| 
 | |
|     <!-- Additional artifact repository consulted alongside the default ones. -->
 | |
|     <!-- NOTE(review): presumably required for the graphframes dependency; confirm before removing. -->
 | |
|     <repositories>
 | |
|         <repository>
 | |
|             <id>SparkPackagesRepo</id>
 | |
|             <url>https://repos.spark-packages.org</url>
 | |
|         </repository>
 | |
|     </repositories>
 | |
| 
 | |
|     <!-- Versions referenced by the ${...} placeholders in <dependencies>. -->
 | |
|     <!-- The Spark modules are all pinned to the same release and are consumed as _2.11 (Scala 2.11) artifacts. -->
 | |
|     <properties>
 | |
|         <org.apache.spark.spark-core.version>2.4.8</org.apache.spark.spark-core.version>
 | |
|         <org.apache.spark.spark-sql.version>2.4.8</org.apache.spark.spark-sql.version>
 | |
|         <org.apache.spark.spark-streaming.version>2.4.8</org.apache.spark.spark-streaming.version>
 | |
|         <org.apache.spark.spark-mllib.version>2.4.8</org.apache.spark.spark-mllib.version>
 | |
|         <org.apache.spark.spark-graphx.version>2.4.8</org.apache.spark.spark-graphx.version>
 | |
|         <!-- graphframes encodes its target Spark and Scala line in the version string; it must match the Spark 2.4.x / Scala 2.11 artifacts used by this module. -->
 | |
|         <graphframes.version>0.8.1-spark2.4-s_2.11</graphframes.version>
 | |
|         <org.apache.spark.spark-streaming-kafka.version>2.4.8</org.apache.spark.spark-streaming-kafka.version>
 | |
|         <com.datastax.spark.spark-cassandra-connector.version>2.5.2</com.datastax.spark.spark-cassandra-connector.version>
 | |
|         <com.datastax.spark.spark-cassandra-connector-java.version>1.6.0-M1</com.datastax.spark.spark-cassandra-connector-java.version>
 | |
|         <postgres.version>42.3.3</postgres.version>
 | |
|     </properties>
 | |
| 
 | |
| </project> |