Вы находитесь на странице: 1из 3

---
title: "Assignment 1"
output: html_document
---

```{r setup, include=FALSE}
# Show each chunk's source code in the knitted output by default.
knitr::opts_chunk$set(echo = TRUE)

# Packages used by the chunks below (load order kept as in the original).
library(dplyr)
library(ggplot2)
library(plotly)
```

## Datasets
```{r cars}
# Directory that holds the three CSV files used in this document. It is
# defined once so that moving the data only requires editing this line.
data_dir <- "D:/Sem 2/DataVisualization/Datasets"

# file.path() joins with "/", so the resulting paths are the same strings the
# document previously spelled out in full for each file.
parliament <- read.csv(file = file.path(data_dir, "parliament.csv"))
cricket <- read.csv(file = file.path(data_dir, "odi-batting.csv"))
tweet <- read.csv(file = file.path(data_dir, "narendramodi_tweets.csv"))
```

## 1. For top ten parties compute the following metrics for the year 2009
### a) Total number of contestants
```{r}
# Top 10 parties by winning positions: count rows with Position == 1 per
# party over the whole data set and keep the ten largest counts.
top <- parliament %>%
  filter(Position == 1) %>%
  group_by(PARTY) %>%
  summarise(tot_wins = n()) %>%
  arrange(-tot_wins)
top_10 <- head(top, 10)

# Data of top 10 parties: every row of `parliament` belonging to one of them.
data_top_parties <- parliament %>%
  filter(PARTY %in% top_10$PARTY)

# Distinct candidate names per party in 2009, largest first.
top_parties_contestnts <- data_top_parties %>%
  filter(YEAR == 2009) %>%
  group_by(PARTY) %>%
  summarise(Tot_contestnt = n_distinct(NAME)) %>%
  arrange(-Tot_contestnt)

# Bars ordered from most to fewest contestants, one fill colour per party.
ggplot(
  top_parties_contestnts,
  aes(
    x = reorder(PARTY, -Tot_contestnt),
    y = Tot_contestnt,
    fill = as.factor(PARTY)
  )
) +
  geom_col() +
  labs(x = "Party", y = "Total Contestants", fill = "Parties")
```

### b) Total number of winning seats
```{r}
# Rows with Position == 1 per top-10 party in 2009, largest count first.
top_parties_wins <- data_top_parties %>%
  filter(YEAR == 2009, Position == 1) %>%
  group_by(PARTY) %>%
  summarise(Tot_win_seats = n()) %>%
  arrange(-Tot_win_seats)

# Bars ordered from most to fewest winning seats, one fill colour per party.
ggplot(
  top_parties_wins,
  aes(
    x = reorder(PARTY, -Tot_win_seats),
    y = Tot_win_seats,
    fill = as.factor(PARTY)
  )
) +
  geom_col() +
  labs(x = "Party", y = "Winning Seats", fill = "Parties")
```

### c) Avg. % of votes
```{r}
# 2009 rows of the top-10 parties, shared by both summaries below.
votes_2009 <- data_top_parties %>%
  filter(YEAR == 2009)

# One-row table with the combined 2009 votes of the top-10 parties.
Total_Votes <- votes_2009 %>%
  summarise(Tot_Votes = sum(VOTES))

# Each party's votes as a percentage of that combined total.
avg_votes <- votes_2009 %>%
  group_by(PARTY) %>%
  summarise(Avg_Votes = (sum(VOTES) / Total_Votes$Tot_Votes) * 100)

# Bars ordered from largest to smallest share, one fill colour per party.
ggplot(
  avg_votes,
  aes(
    x = reorder(PARTY, -Avg_Votes),
    y = Avg_Votes,
    fill = as.factor(PARTY)
  )
) +
  geom_col() +
  labs(x = "Party", y = "Avg Votes", fill = "Parties")
```

### d) Identify top ten candidates with highest % margin of votes for the year 2009
```{r}
# Winner (Position == 1) and runner-up (Position == 2) rows for 2009.
# STATE is kept alongside PC so each row can be matched by key below; the
# totals further down are also computed per (STATE, PC).
Pos1 <- parliament %>%
  filter(YEAR == 2009, Position == 1) %>%
  select(STATE, PC, NAME, Vote1 = VOTES)
Pos2 <- parliament %>%
  filter(YEAR == 2009, Position == 2) %>%
  select(STATE, PC, NAME, Vote2 = VOTES)

# Total votes cast in each constituency in 2009.
Total <- parliament %>%
  filter(YEAR == 2009) %>%
  group_by(STATE, PC) %>%
  summarise(Total_Votes = sum(VOTES)) %>%
  ungroup()

# Combine the three tables by constituency key rather than by row position:
# `Total` is ordered by (STATE, PC) after summarise() while Pos1/Pos2 keep
# file order, so binding columns side by side can pair a winner with another
# constituency's votes. inner_join() also drops constituencies without a
# runner-up row, for which a margin is undefined.
Margin_df <- Pos1 %>%
  inner_join(select(Pos2, -NAME), by = c("STATE", "PC")) %>%
  inner_join(Total, by = c("STATE", "PC")) %>%
  transmute(
    Name = NAME,
    PC,
    Winning_Votes = Vote1,
    Runner_Up_Votes = Vote2,
    Total_Votes
  )

# Margin = (winner - runner-up) as a percentage of all votes in the
# constituency; keep the ten largest margins.
Margin_df <- Margin_df %>%
  mutate(Margin = ((Winning_Votes - Runner_Up_Votes) / Total_Votes) * 100) %>%
  arrange(desc(Margin)) %>%
  head(10) %>%
  select(Name, Margin)

# Horizontal bars, largest margin at the top.
ggplot(Margin_df, aes(x = reorder(Name, Margin), y = Margin)) +
  geom_bar(stat = "identity") +
  coord_flip() +
  xlab("Candidate Name") +
  ylab("Margin %")
```

## 2. Identify the year-wise percentage of male and female candidates
```{r}
# Distinct candidate names for every party / year / sex combination.
parliament_gender <- parliament %>%
  group_by(PARTY, YEAR, SEX) %>%
  summarise(contestnts = n_distinct(NAME))

# Per-year denominator: the sum of the counts above within each year.
yearwise_contestants <- parliament_gender %>%
  group_by(YEAR) %>%
  summarise(total_contestnts = sum(contestnts))

# Attach the yearly total to every party / year / sex row.
parliament_gender <- merge(
  parliament_gender,
  yearwise_contestants,
  by = "YEAR"
)

# Share of the year's contestants for each row; empty SEX values are
# relabelled so they show up as their own legend entry.
gender_percentage <- parliament_gender %>%
  mutate(
    Gender_percent = (contestnts / total_contestnts) * 100,
    SEX = as.character(SEX),
    SEX = replace(SEX, SEX == "", "No Data")
  )

# Stacked bars per year, coloured by sex.
ggplot(
  gender_percentage,
  aes(x = as.factor(YEAR), y = Gender_percent, fill = SEX)
) +
  geom_col() +
  labs(x = "Year", y = "Gender Percent", fill = "Gender")
```

## 3. Create a new column by binning the Runs column using the following ranges and plot the frequency count of ranges 0-25, 26-50, 51-75, 76-100, 100+
```{r}
# Label every innings with its run range. Values matching none of the
# conditions get NA from case_when().
cricket <- cricket %>%
  mutate(
    Run_bin = case_when(
      Runs %in% 0:25 ~ "0-25",
      Runs %in% 26:50 ~ "26-50",
      Runs %in% 51:75 ~ "51-75",
      Runs %in% 76:100 ~ "76-100",
      Runs > 100 ~ "100+"
    )
  )

# Number of innings in each range.
Bin_Table <- cricket %>%
  group_by(Run_bin) %>%
  summarise(Freq = n())

# Drop the unlabelled (NA) bin before plotting; bars ordered by frequency.
ggplot(
  na.omit(Bin_Table),
  aes(x = reorder(Run_bin, -Freq), y = Freq, fill = Run_bin)
) +
  geom_col() +
  labs(x = "Run Range", y = "Frequency Count", fill = "Run Slots")
```

## 4. Consider the top ten players by total runs and compute and visualize the number of centuries across years (use facet_grid or facet_wrap)
```{r}
# Ten players with the highest career run totals. na.rm = TRUE keeps a single
# missing Runs value from turning a player's whole total into NA, which would
# push that player out of the ranking.
cricket_top10 <- cricket %>%
  group_by(Player) %>%
  summarise(Tot_runs = sum(Runs, na.rm = TRUE)) %>%
  arrange(desc(Tot_runs)) %>%
  head(10)

# All innings of those ten players.
summary <- cricket %>%
  filter(Player %in% cricket_top10$Player)

# Four-digit year taken from MatchDate, parsed as month-day-year.
summary$Year <- format(as.Date(summary$MatchDate, "%m-%d-%Y"), "%Y")

# Centuries per player and year. The document's weighting is kept (100-199
# counts once, a double century counts twice) but now covers every score:
# scores above 200 and missing Runs previously matched no branch and made
# the yearly sum NA.
Century_table <- summary %>%
  mutate(
    Century_Flag = case_when(
      Runs >= 200 ~ 2,
      Runs >= 100 ~ 1,
      TRUE ~ 0
    )
  ) %>%
  group_by(Player, Year) %>%
  summarise(Total_Centuries = sum(Century_Flag, na.rm = TRUE)) %>%
  ungroup()

# One panel per player; converted to an interactive plot with ggplotly().
g <- ggplot(
  Century_table,
  aes(
    x = reorder(as.factor(Year), Total_Centuries),
    y = Total_Centuries,
    fill = Year
  )
) +
  xlab("Year") +
  ylab("Centuries") +
  geom_bar(stat = "identity") +
  facet_wrap(~Player)
ggplotly(g)
```

## 5. Create a scatter plot with the following details: X axis contains number of retweets; Y axis contains number of likes; Color represents device from which it was tweeted.
```{r}
# Retweets (x) against favourites (y), one point per tweet, coloured by the
# `source` column. Only the colour aesthetic is mapped, so the legend title
# is set through labs(color = ...); the former scale_fill_continuous() call
# addressed an unmapped fill aesthetic and had no effect.
ggplot(
  tweet,
  aes(x = retweets_count, y = favorite_count, color = source)
) +
  geom_point() +
  labs(color = "Source")
```

Вам также может понравиться