123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507 |
# Vowel lookup exercise: find which letters of the alphabet are vowels.
vowels <- c("a", "e", "i", "o", "u", "y")
alphabet <- letters

# r1 is a logical vector aligned with `letters`: TRUE where the letter is
# one of `vowels`, FALSE otherwise.
r1 <- letters %in% vowels

# r2 holds the alphabet positions of the vowels. It has to be computed after
# r1 exists; which() already keeps only the TRUE entries, so comparing with
# `== TRUE` is unnecessary.
r2 <- which(r1)

# The integers 1 to 6.
v1 <- seq_len(6)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- ?which
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- ?letters
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- ?which
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- ?strsplit
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
# Inspect `myname_split` (presumably the list returned by strsplit() in the
# sourced script -- TODO confirm). R indexes from 1, so `[0]` only ever gives
# an empty result; `[` keeps the list wrapper while `[[` unwraps the element.
myname_split[1]       # one-element list holding the first component
myname_split[[1]]     # the first component itself
myname_split[[1]][1]  # first entry of that component
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- print(r6)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP1_2.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- rep(c(0,1),13)
- c(1,26,1)
- seq(1,26,1)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- install.packages("ggplot2")
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
# Interactive exploration of `msleep` (assumed to be the dataset shipped with
# ggplot2 and made available by the sourced script -- TODO confirm).

# Help pages consulted during the session.
?head
?names
?str
?summary

# head(): first elements of a vector / first rows of a table.
head(letters)
head(letters, n = 7)
head(msleep)
head(msleep, n = 2)

# str(): compact description of an object's structure.
str(1:12)
str(freeny)
str(msleep)

# summary(): per-object / per-column summaries.
summary(letters)
summary(msleep)

# Print the full objects.
letters
msleep
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- msleep
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- msleep
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- msleep
- msleep
- ?na.omit
- msleep
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- summary("pauline")
- summary('p','a','u')
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- summary(strsplit(Pauline, NULL))
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- summary(strsplit("Pauline", NULL))
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- summary(strsplit("Pauline", NULL))
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- View(p600)
- p600[[1]][1]
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- letters %in% p600
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', encoding = 'ASCII', echo=TRUE)
- ?substr
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- msleep
# Row index of the entry whose first column equals "Cow". The value must be a
# quoted string: a bare Cow makes R look for an object of that name and fail.
which(msleep[[1]] == "Cow")
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- msleep
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- which( msleep[[1]] == "w")
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- p777 <- which( msleep[[1]] == "w")
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- install.packages("rapportools")
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- source('C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/TP2_1.R', echo=TRUE)
- n
- n
- n
- n
- library(tidyverse)
- library(ggplot2)
- setwd("C:/Users/nunes/OneDrive/Bureau/WorkDay/INSA/Big_Data/Projet")
###########################
# Acquisition of the data #
###########################

# Reads the file "yob<year>.txt" from the working directory (comma-separated,
# no header row) and returns it in the format "Year,Name,Sex,Number".
read_births_year <- function(year) {
  births <- read.table(
    paste0("yob", year, ".txt"),
    header = FALSE,
    sep = ",",
    col.names = c("Name", "Sex", "Number"),
    # Keep names and sexes as character so yearly tables with different sets
    # of names can be stacked without factor-level juggling.
    stringsAsFactors = FALSE
  )
  cbind(Year = year, births)
}

# Table containing all the information, one row per (Year, Name, Sex).
# Every yearly table is read first and stacked once at the end, instead of
# growing the table with rbind() on each loop iteration, which copies the
# accumulated rows again every year.
final_table <- bind_rows(lapply(seq(1880, 2019, 1), read_births_year))
####################################################################
# Part 1 - The influence of Marilyn since 1880                     #
####################################################################

# Each (Year, Name, Sex) combination is a single row of final_table, so a
# plain filter already yields one row per year; no grouping is needed.

# Yearly number of girls named Marilyn.
MarilynFemme <- final_table %>%
  filter(Name == "Marilyn", Sex == "F")

# Yearly number of boys named Marilyn.
MarilynHomme <- final_table %>%
  filter(Name == "Marilyn", Sex == "M")

ggplot(MarilynFemme, aes(x = Year, y = Number, fill = Number)) +
  geom_bar(stat = "identity") +
  ggtitle("Evolution des naissances avec le prénom Marilyn depuis 1880, femmes")

ggplot(MarilynHomme, aes(x = Year, y = Number, fill = Number)) +
  geom_bar(stat = "identity") +
  ggtitle("Evolution des naissances avec le prénom Marilyn depuis 1880, hommes")

# Yearly number of boys named Adolph.
AdolphHomme <- final_table %>%
  filter(Name == "Adolph", Sex == "M")

ggplot(AdolphHomme, aes(x = Year, y = Number, fill = Number)) +
  geom_bar(stat = "identity") +
  ggtitle("Evolution des naissances avec le prénom Adolph depuis 1880, hommes")
##################################
# 1.1 - Number of births by year #
##################################

# Total number of births per year, both sexes together.
NaissancesAnDepuis1880 <- final_table %>%
  group_by(Year) %>%
  summarise(NbrBirths = sum(Number))

ggplot(
  NaissancesAnDepuis1880,
  aes(x = Year, y = NbrBirths, color = NbrBirths)
) +
  geom_line(size = 3) +
  ggtitle("Nombre de naissances par année depuis 1880, sexes confondus")

# Births per year and sex for the years strictly between 1960 and 1990.
NaissancesAn6090 <- final_table %>%
  filter(Year > 1960, Year < 1990) %>%
  group_by(Year, Sex) %>%
  summarise(NbrBirths = sum(Number)) %>%
  ungroup()

# The plot expression must end at ggtitle(): a trailing `+` would pull the
# next assignment into the plot expression and make the statement fail.
ggplot(NaissancesAn6090, aes(x = Year, y = NbrBirths, color = Sex)) +
  geom_line(size = 5) +
  geom_point() +
  ggtitle("Nombre de naissances par année, entre 1960 et 1990")

# Births per year and sex over the whole period.
NaissancesSexeSep <- final_table %>%
  group_by(Year, Sex) %>%
  summarise(NbrBirths = sum(Number)) %>%
  ungroup()

ggplot(NaissancesSexeSep, aes(x = Year, y = NbrBirths, color = Sex)) +
  geom_line(size = 5) +
  geom_point() +
  ggtitle("Nombre de naissances par année, sexe séparés")
# Five most given male names over the whole period.
PrenomsHommeDepuis1880 <- final_table %>%
  filter(Sex == "M") %>%
  group_by(Name) %>%
  summarise(NumberOfBirths = sum(Number)) %>%
  arrange(desc(NumberOfBirths)) %>%
  # Rank explicitly on the birth count instead of relying on top_n() picking
  # the last column by default.
  top_n(5, NumberOfBirths)

ggplot(PrenomsHommeDepuis1880, aes(x = Name, y = NumberOfBirths)) +
  geom_bar(stat = "identity") +
  ggtitle("Most given male names since 1880")

# Data for the pie chart: hard-coded shares for the five names and for all
# other names. NOTE: this deliberately reuses the name PrenomsHommeDepuis1880,
# so from here on it holds the pie-chart data, not the top-5 table.
PrenomsHommeDepuis1880 <- data.frame(
  name = c("James", "John", "Robert", "Michael", "William", "Others"),
  value = c(2.89, 2.86, 2.70, 2.44, 2.34, 86.77)
)

# Basic pie chart: a single stacked bar drawn in polar coordinates. The data
# argument must be the data frame built above; `data` on its own is a
# function from the utils package, not a table.
ggplot(PrenomsHommeDepuis1880, aes(x = "", y = value, fill = name)) +
  geom_bar(stat = "identity", width = 1) +
  coord_polar("y", start = 0) +
  theme_void()
# Five most given female names over the whole period.
PrenomsFemmesDepuis1880 <- final_table %>%
  filter(Sex == "F") %>%
  group_by(Name) %>%
  summarise(NumberOfBirths = sum(Number)) %>%
  arrange(desc(NumberOfBirths)) %>%
  # Rank explicitly on the birth count instead of relying on top_n() picking
  # the last column by default.
  top_n(5, NumberOfBirths)

ggplot(PrenomsFemmesDepuis1880, aes(x = Name, y = NumberOfBirths)) +
  geom_bar(stat = "identity") +
  ggtitle("Most given female names since 1880")

# Data for the pie chart: hard-coded shares for the five names and for all
# other names.
name <- c("Mary", "Elizabeth", "Patricia", "Jennifer", "Linda", "Others")
value <- c(2.35, 0.94, 0.89, 0.84, 0.83, 94.15)
PrenonesFemmes1880 <- data.frame(name, value)

# Basic pie chart: a single stacked bar drawn in polar coordinates.
ggplot(PrenonesFemmes1880, aes(x = "", y = value, fill = name)) +
  geom_bar(stat = "identity", width = 1) +
  coord_polar("y", start = 0) +
  theme_void()
#########
# Most given male names for the years after 2000 (Year > 2000).

# Five most given male names in that period.
PrenomsHommeDepuis2000 <- final_table %>%
  filter(Sex == "M", Year > 2000) %>%
  group_by(Name) %>%
  summarise(NumberOfBirths = sum(Number)) %>%
  arrange(desc(NumberOfBirths)) %>%
  top_n(5, NumberOfBirths)

ggplot(PrenomsHommeDepuis2000, aes(x = Name, y = NumberOfBirths)) +
  geom_bar(stat = "identity") +
  ggtitle("Most given male names since 2000")

# Total number of male births in that period (one-row table: Sex, total).
NbrMaleBirths2000 <- final_table %>%
  filter(Sex == "M", Year > 2000) %>%
  group_by(Sex) %>%
  summarise(NumberOfBirths = sum(Number))

# Births accounted for by the five names above (one-row table, column N).
top5MaleNames2000 <- PrenomsHommeDepuis2000 %>%
  summarise(N = sum(NumberOfBirths))

# Births with any other name, as a plain number. Extracting the columns with
# `$` matters: subtracting the one-column tables gives a data frame, and
# putting a data frame inside c() turns the whole vector into a list, so the
# pie data would end up without a usable `value` column.
OtherMaleNames2000 <- NbrMaleBirths2000$NumberOfBirths - top5MaleNames2000$N

# Data for the pie chart, taken from the computed top five rather than from
# hand-copied names and counts.
PrenomsHomme2000 <- data.frame(
  name = c(as.character(PrenomsHommeDepuis2000$Name), "Others"),
  value = c(PrenomsHommeDepuis2000$NumberOfBirths, OtherMaleNames2000)
)

# Basic pie chart: a single stacked bar drawn in polar coordinates.
ggplot(PrenomsHomme2000, aes(x = "", y = value, fill = name)) +
  geom_bar(stat = "identity", width = 1) +
  coord_polar("y", start = 0) +
  theme_void()
#########
# Most given female names for the years after 2000 (Year > 2000).

# Five most given female names in that period.
PrenomsFemmeDepuis2000 <- final_table %>%
  filter(Sex == "F", Year > 2000) %>%
  group_by(Name) %>%
  summarise(NumberOfBirths = sum(Number)) %>%
  arrange(desc(NumberOfBirths)) %>%
  top_n(5, NumberOfBirths)

ggplot(PrenomsFemmeDepuis2000, aes(x = Name, y = NumberOfBirths)) +
  geom_bar(stat = "identity") +
  ggtitle("Most given female names since 2000")

# Total number of female births in that period (one-row table: Sex, total).
NbrFemaleBirths2000 <- final_table %>%
  filter(Sex == "F", Year > 2000) %>%
  group_by(Sex) %>%
  summarise(NumberOfBirths = sum(Number))

# Births accounted for by the five names above (one-row table, column N).
top5FemaleNames2000 <- PrenomsFemmeDepuis2000 %>%
  summarise(N = sum(NumberOfBirths))

# Births with any other name, as a plain number. The total must be the
# female one (not the male total), and the columns are extracted with `$` so
# the result is a number rather than a one-cell data frame.
OtherFemaleNames2000 <-
  NbrFemaleBirths2000$NumberOfBirths - top5FemaleNames2000$N

# Data for the pie chart, taken from the computed top five rather than from
# hand-copied names and counts.
name <- c(as.character(PrenomsFemmeDepuis2000$Name), "Others")
value <- c(PrenomsFemmeDepuis2000$NumberOfBirths, OtherFemaleNames2000)
PrenomsFemme2000 <- data.frame(name, value)

# Basic pie chart: a single stacked bar drawn in polar coordinates.
ggplot(PrenomsFemme2000, aes(x = "", y = value, fill = name)) +
  geom_bar(stat = "identity", width = 1) +
  coord_polar("y", start = 0) +
  theme_void()
###############################################
# The evolution of the name James since 1880 #
###############################################
# Yearly number of births named James, summed over both sexes.
james_rows <- filter(final_table, Name == "James")
EvolutionJames <- summarise(
  group_by(james_rows, Year),
  NumberOfBirths = sum(Number)
)

james_plot <- ggplot(EvolutionJames, aes(x = Year, y = NumberOfBirths))
james_plot +
  geom_line(size = 5) +
  geom_point() +
  ggtitle("The evolution of the name James since 1880")

##############################################
# The evolution of the name Mary since 1880 #
##############################################
# Yearly number of births named Mary, summed over both sexes.
mary_rows <- filter(final_table, Name == "Mary")
EvolutionMary <- summarise(
  group_by(mary_rows, Year),
  NumberOfBirths = sum(Number)
)

mary_plot <- ggplot(EvolutionMary, aes(x = Year, y = NumberOfBirths))
mary_plot +
  geom_line(size = 5) +
  geom_point() +
  ggtitle("The evolution of the name Mary since 1880")
|