Starting off as a muggle who is naïve to the world of maths and data science.

Day 10 (2)

Data Structure (cont’d)

data.frame(data): two-dimensional, multiple data types

# Build a two-row data frame whose three columns each hold a different
# type of value: text, numbers and logicals.
data.frame(
  string  = c("zero", "one"),
  number  = c(0, 1),
  boolean = c(FALSE, TRUE)
)

Result:


Add data

rbind(variable_name, variable_name)

# Start from a data frame with three rows and two columns.
df <- data.frame(
  column_one = c(1, 2, 3),
  column_two = c(4, 5, 6)
)

# rbind() returns a copy of df with the vector appended as a new last row;
# the values are matched to the columns by position.
rbind(df, c(7, 8))

Result:


cbind(variable_name, variable_name)

# Start from a data frame with three rows and two columns.
df <- data.frame(
  column_one = c(1, 2, 3),
  column_two = c(4, 5, 6)
)

# cbind() returns a copy of df with the vector appended as a new last column.
# Give the new column a name: an unnamed vector would be labelled with its
# own expression, producing a column literally called `c(9, 10, 11)`.
cbind(df, column_three = c(9, 10, 11))

Result:


Import data

read.csv(file_path, header=TRUE/FALSE)

# Read a CSV file into a data frame; header = TRUE treats the first line of
# the file as the column names. The path below is only an example.
df <- read.csv(file = "C:/folder/file.csv", header = TRUE)

Access column
df <- data.frame(
  column_one = c(1, 2, 3),
  column_two = c(4, 5, 6)
)

# Three ways to pull a column out of a data frame:
df["column_one"]  # by name with single brackets: a one-column data frame
df$column_one     # by name with `$`: the column as a plain vector
df[, 2]           # by position: every row of the second column, as a vector

Result:


Delete column
df <- data.frame(
  column_one = c(1, 2, 3),
  column_two = c(4, 5, 6)
)

# Assigning NULL to a column removes that column from the data frame.
df[["column_one"]] <- NULL

Result:


Data frame functions

nrow(variable_name)

# nrow() counts the rows of a data frame; this one has four.
nrow(data.frame(string = c("zero", "one", "two", "three")))

Result: 4


ncol(variable_name)

# ncol() counts the columns of a data frame; this one has three.
ncol(data.frame(one = "one", two = "two", three = "three"))

Result: 3


dim(variable_name)

# dim() reports both sizes at once: number of rows, then number of columns.
dim(
  data.frame(
    one = c("one", "two", "three"),
    two = c(1, 2, 3)
  )
)

Result: 3 2


names(variable_name)

# names() returns the column names of a data frame as a character vector.
names(data.frame(name_one = 1, name_two = 2))

Result: "name_one" "name_two"


head(variable_name, quantity)

# head() keeps the first n rows of a data frame (here the first two).
head(data.frame(column = c(1, 2, 3, 4, 5)), n = 2)

Result:


tail(variable_name, quantity)

# tail() keeps the last n rows of a data frame (here the last two).
tail(data.frame(column = c(1, 2, 3, 4, 5)), n = 2)

Result:


list(data): multi-dimensional, multiple data types

# Three vectors of different types and lengths.
a <- FALSE
b <- c(1, 2)
c <- c("Three", "Four")

# A list can hold all of them, plus a bare number, each as its own element.
list(a, b, c, 5)

Result:

Leave a comment