← 홈

📊

⌘K

Tailwind CSS 프로그래밍 언어

Ruby on Rails 프로그래밍 언어

Kubernetes DevOps & CLI

☁️

AWS CLI DevOps & CLI

🔄

GitHub Actions DevOps & CLI

🐧

Linux 명령어 DevOps & CLI

💻

Bash 스크립팅 DevOps & CLI

Makefile DevOps & CLI

Terraform DevOps & CLI

Prometheus DevOps & CLI

Fish Shell DevOps & CLI

💙

PowerShell DevOps & CLI

Azure CLI DevOps & CLI

☁️

Google Cloud CLI DevOps & CLI

Apache Airflow DevOps & CLI

TensorFlow 데이터베이스 & 데이터

📈

Matplotlib 데이터베이스 & 데이터

🐘

PostgreSQL 데이터베이스 & 데이터

Elasticsearch 데이터베이스 & 데이터

🤖

Scikit-learn 데이터베이스 & 데이터

👁️

OpenCV 데이터베이스 & 데이터

⚡

Apache Spark 데이터베이스 & 데이터

🪶

SQLite 데이터베이스 & 데이터

⚡

Supabase 데이터베이스 & 데이터

🔵

Neo4j 데이터베이스 & 데이터

📨

Apache Kafka 데이터베이스 & 데이터

🐰

RabbitMQ 데이터베이스 & 데이터

reStructuredText 유틸리티

Microsoft Excel 오피스 애플리케이션

📘

Microsoft Word 오피스 애플리케이션

📙

Microsoft PowerPoint 오피스 애플리케이션

Google 문서 Google Workspace

📊

Google 스프레드시트 Google Workspace

📽️

Google 프레젠테이션 Google Workspace

🔌

Cadence Virtuoso EDA & 하드웨어

⚙️

Synopsys EDA EDA & 하드웨어

💎

Verilog & VHDL EDA & 하드웨어

검색 결과가 없습니다

기초

변수와 데이터 타입

할당

x <- 10
x = 10  # also works

숫자

x <- 3.14

정수

x <- 5L

문자

name <- "R"

논리

flag <- TRUE

벡터

v <- c(1, 2, 3, 4, 5)

리스트

lst <- list(name="John", age=30)

타입 확인

class(x)
typeof(x)

벡터

벡터 생성

v <- c(1, 2, 3, 4, 5)

시퀀스

1:10
seq(1, 10, by=2)

반복

rep(1, times=5)
rep(1:3, each=2)

요소 접근

v[1]  # first element (1-indexed)
v[c(1,3)]  # 1st and 3rd

슬라이스

v[2:4]  # elements 2 to 4

음수 인덱스

v[-1]  # all except first

벡터 연산

v * 2  # element-wise
sum(v)
mean(v)
max(v), min(v)

데이터 프레임

데이터 프레임 생성

생성

df <- data.frame(
  name = c("Alice", "Bob"),
  age = c(25, 30)
)

벡터로부터

df <- data.frame(col1=v1, col2=v2)

구조 확인

str(df)
head(df)
tail(df)

차원

nrow(df)
ncol(df)
dim(df)

열 이름

names(df)
colnames(df)

데이터 접근

열

df$name
df["name"]
df[, "name"]

행

df[1, ]  # first row

셀

df[1, 2]  # row 1, col 2

여러 열

df[, c("name", "age")]

행 필터링

df[df$age > 25, ]

부분집합

subset(df, age > 25)

데이터 조작

열 추가

df$new_col <- values

열 제거

df$col <- NULL

병합

merge(df1, df2, by="id")

행 결합

rbind(df1, df2)

열 결합

cbind(df1, df2)

정렬

df[order(df$age), ]

제어 흐름

조건문과 반복문

If/else

if (x > 0) {
  print("positive")
} else if (x < 0) {
  print("negative")
} else {
  print("zero")
}

Ifelse (벡터화)

ifelse(x > 0, "pos", "neg")

For 루프

for (i in 1:10) {
  print(i)
}

While 루프

while (x < 10) {
  x <- x + 1
}

Break/Next

for (i in 1:10) {
  if (i == 5) break
  if (i == 3) next
  print(i)
}

함수

함수 정의

기본 함수

add <- function(a, b) {
  return(a + b)
}

기본 인자

greet <- function(name = "World") {
  paste("Hello,", name)
}

암시적 반환

square <- function(x) x^2

다중 반환

stats <- function(v) {
  list(mean=mean(v), sd=sd(v))
}

익명 함수

sapply(1:5, function(x) x^2)

Apply 함수

apply

apply(matrix, 1, sum)  # by row
apply(matrix, 2, sum)  # by col

lapply

lapply(list, function)  # returns list

sapply

sapply(list, function)  # simplifies

mapply

mapply(function, v1, v2)  # parallel

tapply

tapply(values, groups, mean)

Tidyverse (dplyr)

dplyr 기초

로드

library(dplyr)
library(tidyverse)

파이프 연산자

df %>% filter(x > 5) %>% select(a, b)

필터

df %>% filter(age > 25)

열 선택

df %>% select(name, age)
df %>% select(-id)  # exclude

변환

df %>% mutate(age2 = age * 2)

정렬

df %>% arrange(age)
df %>% arrange(desc(age))

그룹화

df %>% group_by(category)

요약

df %>% summarize(mean_age = mean(age))

dplyr 추가

조인

left_join(df1, df2, by = "id")
inner_join(df1, df2, by = "id")

고유값

df %>% distinct(category)

카운트

df %>% count(category)

이름 변경

df %>% rename(new_name = old_name)

슬라이스

df %>% slice(1:10)

추출

df %>% pull(column)

시각화

기본 R 플롯

산점도

plot(x, y)

선 그래프

plot(x, y, type = "l")

히스토그램

hist(x)

막대 그래프

barplot(table(x))

박스 플롯

boxplot(y ~ group)

ggplot2

기본 구조

ggplot(df, aes(x=col1, y=col2)) +
  geom_point()

산점도

ggplot(df, aes(x, y)) + geom_point()

선

ggplot(df, aes(x, y)) + geom_line()

막대

ggplot(df, aes(x)) + geom_bar()

히스토그램

ggplot(df, aes(x)) + geom_histogram()

면 분할

+ facet_wrap(~category)

테마

+ theme_minimal()

라벨

+ labs(title="Title", x="X", y="Y")

파일 입출력

읽기와 쓰기

CSV 읽기

df <- read.csv("file.csv")
df <- readr::read_csv("file.csv")

CSV 쓰기

write.csv(df, "file.csv", row.names=FALSE)

엑셀 읽기

library(readxl)
df <- read_excel("file.xlsx")

엑셀 쓰기

library(writexl)
write_xlsx(df, "file.xlsx")

R 객체 저장

saveRDS(obj, "file.rds")

R 객체 로드

obj <- readRDS("file.rds")

통계

기본 통계

요약

summary(df)

평균/중앙값

mean(x)
median(x)

표준편차/분산

sd(x)
var(x)

분위수

quantile(x, 0.25)

상관관계

cor(x, y)

t-검정

t.test(x, y)

카이제곱

chisq.test(table)

선형 회귀

model <- lm(y ~ x, data=df)
summary(model)