
val data = List(
  "State->TN~City->Chennai",
  "State->UP~City->Lucknow"
)

val lis = List("A~B", "C~D", "E~F")

println
println("=====Raw List=====")
println
println(lis)
lis.foreach(println)

// flatMap splits each element on "~" and flattens the pieces into a single list
val split = lis.flatMap(x => x.split("~"))

println
println("=====split List=====")
println
println(split)
split.foreach(println)
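For comparison, a quick sketch (an illustration, not part of the exercise above) of how map differs from flatMap on the same list:

// mapped is a List of 3 Arrays: Array(A, B), Array(C, D), Array(E, F)
val mapped = lis.map(x => x.split("~"))

// flattened is a single List of 6 elements: List(A, B, C, D, E, F)
val flattened = lis.flatMap(x => x.split("~"))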

package pack

object obj {

  def main(args: Array[String]): Unit = {

    println("=====Started=====")

    val data = List(
      "State->TN~City->Chennai",
      "State->UP~City->Lucknow"
    )

    println
    println("=====Raw Data=====")
    println
    data.foreach(println)

    // Split each record on "~" and flatten into individual key->value strings
    val flat = data.flatMap(x => x.split("~"))

    println
    println("=====Splitted Data=====")
    println
    flat.foreach(println)

    // Keep only the State entries
    val statefil = flat.filter(x => x.contains("State"))

    println
    println("=====State Data=====")
    println
    statefil.foreach(println)

    // Keep only the City entries
    val cityfil = flat.filter(x => x.contains("City"))

    println
    println("=====City Data=====")
    println
    cityfil.foreach(println)

    // Strip the "State->" prefix to leave just the state name
    val Statefinal = statefil.map(x => x.replace("State->", ""))

    println
    println("=====Final State Data=====")
    println
    Statefinal.foreach(println)

    // Strip the "City->" prefix to leave just the city name
    val Cityfinal = cityfil.map(x => x.replace("City->", ""))

    println
    println("=====Final City Data=====")
    println
    Cityfinal.foreach(println)
  }
}
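One possible follow-up (a sketch, not part of the program above): the cleaned state and city lists line up by index, so they can be paired back together with zip inside main after both lists are built.

// Pairs each state with its city by position, printing:
// (TN,Chennai)
// (UP,Lucknow)
val pairs = Statefinal.zip(Cityfinal)
pairs.foreach(println)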

"file:///F:/Practice/Data/datatxns"

============Reading USDATA ==================

package pack

import org.apache.spark.SparkContext
import org.apache.spark.SparkConf
import org.apache.spark.sql.SparkSession

object obj {

  def main(args: Array[String]): Unit = {

    println("===started===")
    println

    val conf = new SparkConf()
      .setAppName("wcfinal")
      .setMaster("local[*]")
      .set("spark.driver.host", "localhost")
      .set("spark.driver.allowMultipleContexts", "true")

    val sc = new SparkContext(conf) // RDD

    sc.setLogLevel("ERROR")

    val spark = SparkSession.builder().config(conf).getOrCreate() // Dataframe

    // Read the raw text file into an RDD with a single partition
    val data = sc.textFile("file:///D:/data/usdata", 1)

    data.take(10).foreach(println)

    // Keep only the lines longer than 200 characters
    val lendata = data.filter(x => x.length > 200)

    println
    println("===len > 200===")
    println
    lendata.foreach(println)

    // Split each line on "," and flatten into individual fields
    val flatdata = lendata.flatMap(x => x.split(","))

    println
    println("===flatdata===")
    println
    flatdata.foreach(println)

    // Remove "-" characters from every field
    val repdata = flatdata.map(x => x.replace("-", ""))

    println
    println("===repdata===")
    println
    repdata.foreach(println)

    // Append ",zeyo" to every field
    val condata = repdata.map(x => x + ",zeyo")

    println
    println("===condata===")
    println
    condata.foreach(println)
  }
}
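If the transformed data needs to be kept, an RDD can be written back out with saveAsTextFile. A minimal sketch that would sit inside main after condata is built; the output path here is only an assumed example:

// Writes one part file per partition under the given directory (assumed path)
condata.saveAsTextFile("file:///D:/data/usdata_out")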

==================Column based filter / Schema RDD filter========================

package pack

import org.apache.spark.SparkContext
import org.apache.spark.SparkConf
import org.apache.spark.sql.SparkSession

object obj {

  // Case class describing the three columns of each record
  case class columns(id: String, category: String, product: String)

  def main(args: Array[String]): Unit = {

    println("===started===")
    println

    val conf = new SparkConf().setAppName("wcfinal").setMaster("local[*]")

    val sc = new SparkContext(conf) // RDD

    sc.setLogLevel("ERROR")

    val spark = SparkSession.builder().config(conf).getOrCreate() // Dataframe

    val data = sc.textFile("file:///F:/Practice/Data/datatxns")

    data.foreach(println)

    // Split each line on "," into an array of fields
    val split = data.map(x => x.split(","))

    // Map each array onto the case class to get a schema RDD
    val schemardd = split.map(x => columns(x(0), x(1), x(2)))

    // Keep only the rows whose product column contains "Gymnastics"
    val filrdd = schemardd.filter(x => x.product.contains("Gymnastics"))

    println
    filrdd.foreach(println)
  }
}
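Since a SparkSession is already created, the case-class RDD can also be turned into a DataFrame. A minimal sketch, assuming it is placed inside main after schemardd is built:

// Needed for the rdd-to-DataFrame conversion
import spark.implicits._

// Column names come from the case class fields: id, category, product
val df = schemardd.toDF()
df.show()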
