# Install any dependency that is not yet available
invisible(lapply(
  c("data.table", "jsonlite", "ggpubr", "ggthemes"),
  function(pkg) {
    if (!requireNamespace(pkg, quietly = TRUE)) {
      install.packages(pkg)
    }
  }
))
# Attach the packages
library(data.table)
library(jsonlite)
library(ggpubr)
library(ggthemes)

箱式图
注记
Hiplot 网站
本页面为 Hiplot Boxplot 插件的源码版本教程,您也可以使用 Hiplot 网站实现无代码绘图,更多信息请查看以下链接:
https://hiplot.cn/basic/boxplot?lang=zh_cn
箱式图(又称箱形图)是一种利用四分位数直观描述一组数据分布特征的图形方法。
环境配置
系统: Cross-platform (Linux/MacOS/Windows)
编程语言: R
依赖包:
data.table;jsonlite;ggpubr;ggthemes
sessioninfo::session_info("attached")
─ Session info ───────────────────────────────────────────────────────────────
setting value
version R version 4.5.2 (2025-10-31)
os Ubuntu 24.04.3 LTS
system x86_64, linux-gnu
ui X11
language (EN)
collate C.UTF-8
ctype C.UTF-8
tz UTC
date 2026-01-28
pandoc 3.1.3 @ /usr/bin/ (via rmarkdown)
quarto 1.8.27 @ /usr/local/bin/quarto
─ Packages ───────────────────────────────────────────────────────────────────
package * version date (UTC) lib source
data.table * 1.18.0 2025-12-24 [1] RSPM
ggplot2 * 4.0.1 2025-11-14 [1] RSPM
ggpubr * 0.6.2 2025-10-17 [1] RSPM
ggthemes * 5.2.0 2025-11-30 [1] RSPM
jsonlite * 2.0.0 2025-03-27 [1] RSPM
[1] /home/runner/work/_temp/Library
[2] /opt/R/4.5.2/lib/R/site-library
[3] /opt/R/4.5.2/lib/R/library
* ── Packages attached to the search path.
──────────────────────────────────────────────────────────────────────────────
数据准备
载入的数据集为不同治疗方案的治疗效果数据。
# Load data: fetch the example JSON, then parse the embedded text table
example_json <- jsonlite::read_json("https://hiplot.cn/ui/basic/boxplot/data.json")
data <- as.data.frame(
  data.table::fread(example_json$exampleData$textarea[[1]])
)
# Prepare data: every pairwise combination of the distinct values in the
# second column, each stored as a character vector
groups <- unique(data[[2]])
my_comparisons <- lapply(combn(groups, 2, simplify = FALSE), as.character)
# Preview the data
head(data)
  Value Group1 Group2
1 4.2 low treat1
2 11.5 low treat1
3 7.3 low treat1
4 5.8 low treat1
5 6.4 low treat1
6 10.0 low treat1
可视化
# Box plot of Value by Group1 (x-axis and color), one facet per Group2 level,
# with the individual observations overlaid as points.
p <- ggboxplot(data, x = "Group1", y = "Value",
               # Spell out FALSE: `F` is an ordinary variable that can be
               # reassigned
               notch = FALSE,
               facet.by = "Group2", add = "point", color = "Group1",
               # The x-axis label must name the variable mapped to x
               # (Group1); Group2 is the faceting variable
               xlab = "Group1", ylab = "Value",
               palette = c("#e04d39", "#5bbad6", "#1e9f86"),
               title = "Box Plot") +
  # Annotate each pair listed in my_comparisons with its t-test p-value
  stat_compare_means(comparisons = my_comparisons, label = "p.format",
                     method = "t.test") +
  # Pad both ends of the y-axis by 10% of the data range
  scale_y_continuous(expand = expansion(mult = c(0.1, 0.1))) +
  theme_stata() +
  theme(text = element_text(family = "Arial"),
        plot.title = element_text(size = 12, hjust = 0.5),
        axis.title = element_text(size = 12),
        axis.text = element_text(size = 10),
        axis.text.x = element_text(angle = 0, hjust = 0.5, vjust = 1),
        legend.position = "right",
        legend.direction = "vertical",
        legend.title = element_text(size = 10),
        legend.text = element_text(size = 10))
# Render the plot
p
横坐标表示几组不同的数据,纵坐标表示各组数据的数值;方框上、中、下的横线分别代表上四分位数、中位数和下四分位数;上下方线段(须线)分别延伸至 1.5 倍四分位距范围内的最大值和最小值,超出该范围的点代表离群值。图示上方数值表示两两变量间的 P 值,可认为治疗方案 1 中,中剂量组同低剂量组疗效有显著差异,以此类推。
