最新的Claude-opus-4-7在科研场景到底有多强...

张开发

• 2026/4/18 6:33:16 • 15 分钟阅读

分享文章

Claude Opus 4.7 深夜上线，又一波AI的大更新开始了……听说新的 Claude Opus 4.7 相比于之前，在图像处理、处理任务、执行指令方面又有了新的提升。这咱不得吃上第一口热乎螃蟹？用咱的单细胞数据来测试一下新模型在科研场景（生信数据分析）上的表现如何。

一、切换模型

/model claude-opus-4-7

首先输入上面的指令，切换成最新的 Claude-opus-4-7。当电脑出现下面的界面，就代表操作成功了。

二、实践环节

小编这里以之前测序的 C2 样本（换任何一个样本都可以）的单细胞数据为例，希望 Claude 可以生成差异表达分析图、GO图、Venn图、火山图和聚类分析图。

输入下面指令：

请你帮我分析C2这个样本，生成差异表达分析图、GO图、Venn图、火山图和聚类分析图

然后 Claude 对单细胞 RNA-seq 的数据进行了下面的深度分析，小编就可以摸鱼去了（不是）。

以下是 Claude-opus-4-7 模型生成的R脚本，速速码住：

# ============================================================
# C2 单细胞RNA-seq 深度分析
# 生成: 差异表达图、GO富集图、Venn图、火山图、聚类热图
# ============================================================

# ---- 依赖包 ----
pkgs <- c("Seurat", "ggplot2", "dplyr", "clusterProfiler", "org.Hs.eg.db",
          "ggVennDiagram", "pheatmap", "ggrepel", "RColorBrewer",
          "enrichplot", "patchwork")
for (p in pkgs) {
  if (!requireNamespace(p, quietly = TRUE)) {
    if (p %in% c("clusterProfiler", "org.Hs.eg.db", "enrichplot")) {
      BiocManager::install(p, ask = FALSE)
    } else {
      install.packages(p, repos = "https://cloud.r-project.org")
    }
  }
  library(p, character.only = TRUE)
}

outdir <- "C:/Users/BMbio/Desktop/C2"

cat("加载 Seurat 对象...\n")
seurat_obj <- readRDS(file.path(outdir, "C2_seurat.rds"))
cat(sprintf("细胞数: %d | Cluster数: %d\n",
            ncol(seurat_obj), length(unique(Idents(seurat_obj)))))

# ============================================================
# 1. 差异表达分析 (FindAllMarkers)
# ============================================================
cat("\n[1/5] 差异表达分析...\n")
markers_all <- FindAllMarkers(
  seurat_obj,
  only.pos = TRUE,
  min.pct = 0.25,
  logfc.threshold = 0.25,
  test.use = "wilcox"
)

# 每个cluster取top5
top5 <- markers_all %>%
  group_by(cluster) %>%
  slice_max(order_by = avg_log2FC, n = 5) %>%
  ungroup()

# DotPlot: 差异表达概览
p_dot <- DotPlot(seurat_obj, features = unique(top5$gene),
                 cols = c("lightgrey", "#E64B35")) +
  RotatedAxis() +
  ggtitle("各Cluster Top5差异表达基因") +
  theme(plot.title = element_text(hjust = 0.5, face = "bold", size = 14),
        axis.text.x = element_text(size = 7))
ggsave(file.path(outdir, "DEG_dotplot.png"), p_dot,
       width = max(14, length(unique(top5$gene)) * 0.35 + 4),
       height = 7, dpi = 200, limitsize = FALSE)
cat("  - DEG_dotplot.png\n")

# 保存差异表达结果
write.csv(markers_all, file.path(outdir, "DEG_all_markers.csv"),
          row.names = FALSE)
cat("  - DEG_all_markers.csv\n")

# ============================================================
# 2. 火山图 (Cluster 0 vs rest)
# ============================================================
cat("\n[2/5] 火山图...\n")

# 对每个cluster做 vs rest 的双向检验
make_volcano <- function(obj, cluster_id) {
  deg <- FindMarkers(obj, ident.1 = cluster_id,
                     min.pct = 0.1, logfc.threshold = 0, test.use = "wilcox")
  deg$gene <- rownames(deg)
  deg$neg_log10_p <- -log10(deg$p_val_adj + 1e-300)
  deg$status <- "NS"
  deg$status[deg$avg_log2FC > 0.5 & deg$p_val_adj < 0.05] <- "Up"
  deg$status[deg$avg_log2FC < -0.5 & deg$p_val_adj < 0.05] <- "Down"

  top_genes <- deg %>%
    filter(status != "NS") %>%
    arrange(p_val_adj) %>%
    head(15)

  ggplot(deg, aes(avg_log2FC, neg_log10_p, color = status)) +
    geom_point(size = 0.8, alpha = 0.7) +
    scale_color_manual(values = c(Up = "#E64B35", Down = "#4DBBD5",
                                  NS = "grey70")) +
    geom_vline(xintercept = c(-0.5, 0.5), linetype = "dashed",
               color = "grey40") +
    geom_hline(yintercept = -log10(0.05), linetype = "dashed",
               color = "grey40") +
    geom_text_repel(data = top_genes, aes(label = gene),
                    size = 2.5, max.overlaps = 20, color = "black") +
    labs(title = paste0("Cluster ", cluster_id, " vs Rest"),
         x = "log2 Fold Change", y = "-log10(adj. p-value)", color = NULL) +
    theme_classic(base_size = 12) +
    theme(plot.title = element_text(hjust = 0.5, face = "bold"))
}

clusters <- levels(Idents(seurat_obj))
# 最多画前6个cluster，避免运行时间过长
n_volcano <- min(6, length(clusters))
volcano_plots <- lapply(clusters[seq_len(n_volcano)], function(cl) {
  cat(sprintf("  Cluster %s...\n", cl))
  make_volcano(seurat_obj, cl)
})
ncol_v <- min(3, n_volcano)
nrow_v <- ceiling(n_volcano / ncol_v)
p_volcano_combined <- wrap_plots(volcano_plots, ncol = ncol_v)
ggsave(file.path(outdir, "volcano_plots.png"), p_volcano_combined,
       width = ncol_v * 5, height = nrow_v * 4.5, dpi = 200,
       limitsize = FALSE)
cat("  - volcano_plots.png\n")

# ============================================================
# 3. GO 富集分析图 (每个cluster top marker做GO BP)
# ============================================================
cat("\n[3/5] GO富集分析...\n")

run_go <- function(gene_vec, cluster_id) {
  eg <- tryCatch(
    bitr(gene_vec, fromType = "SYMBOL", toType = "ENTREZID",
         OrgDb = org.Hs.eg.db),
    error = function(e) NULL
  )
  if (is.null(eg) || nrow(eg) < 5) return(NULL)
  go_res <- enrichGO(gene = eg$ENTREZID, OrgDb = org.Hs.eg.db,
                     ont = "BP", pAdjustMethod = "BH",
                     pvalueCutoff = 0.05, qvalueCutoff = 0.2,
                     readable = TRUE)
  if (is.null(go_res) || nrow(go_res@result) == 0) return(NULL)
  go_res
}

# 取每个cluster top30 marker基因做GO
go_results <- list()
for (cl in clusters) {
  genes_cl <- markers_all %>%
    filter(cluster == cl) %>%
    arrange(p_val_adj) %>%
    head(30) %>%
    pull(gene)
  if (length(genes_cl) < 5) next
  cat(sprintf("  Cluster %s GO...\n", cl))
  go_results[[as.character(cl)]] <- run_go(genes_cl, cl)
}

# 画 barplot (最多展示前4个有结果的cluster)
go_valid <- Filter(Negate(is.null), go_results)
n_go <- min(4, length(go_valid))

if (n_go > 0) {
  go_plots <- lapply(names(go_valid)[seq_len(n_go)], function(cl) {
    barplot(go_valid[[cl]], showCategory = 10,
            title = paste0("Cluster ", cl, " GO BP")) +
      theme(plot.title = element_text(hjust = 0.5, face = "bold", size = 11),
            axis.text.y = element_text(size = 8))
  })
  ncol_go <- min(2, n_go)
  nrow_go <- ceiling(n_go / ncol_go)
  p_go <- wrap_plots(go_plots, ncol = ncol_go)
  ggsave(file.path(outdir, "GO_barplot.png"), p_go,
         width = ncol_go * 7, height = nrow_go * 6, dpi = 200,
         limitsize = FALSE)
  cat("  - GO_barplot.png\n")

  # dotplot for first cluster
  p_go_dot <- dotplot(go_valid[[names(go_valid)[1]]], showCategory = 15) +
    ggtitle(paste0("Cluster ", names(go_valid)[1], " GO BP Dotplot")) +
    theme(plot.title = element_text(hjust = 0.5, face = "bold"))
  ggsave(file.path(outdir, "GO_dotplot.png"), p_go_dot,
         width = 8, height = 8, dpi = 200)
  cat("  - GO_dotplot.png\n")
} else {
  cat("  警告: 没有cluster通过GO富集分析\n")
}

# ============================================================
# 4. Venn 图 (各cluster特异性基因重叠)
# ============================================================
cat("\n[4/5] Venn图...\n")

# 取显著差异基因 (adj.p < 0.05, log2FC > 0.5)
sig_markers <- markers_all %>%
  filter(p_val_adj < 0.05, avg_log2FC > 0.5)

# 最多取前5个cluster做Venn
venn_clusters <- clusters[seq_len(min(5, length(clusters)))]
venn_list <- lapply(venn_clusters, function(cl) {
  sig_markers %>%
    filter(cluster == cl) %>%
    pull(gene) %>%
    unique()
})
names(venn_list) <- paste0("Cluster_", venn_clusters)

# 过滤掉空集
venn_list <- Filter(function(x) length(x) > 0, venn_list)

if (length(venn_list) >= 2) {
  p_venn <- ggVennDiagram(venn_list, label_alpha = 0, edge_size = 0.8) +
    scale_fill_gradient(low = "#F7FBFF", high = "#2171B5") +
    scale_color_manual(values = rep("grey30", length(venn_list))) +
    ggtitle("各Cluster显著差异基因 Venn图") +
    theme(plot.title = element_text(hjust = 0.5, face = "bold", size = 14),
          legend.position = "right")
  ggsave(file.path(outdir, "venn_diagram.png"), p_venn,
         width = 9, height = 7, dpi = 200)
  cat("  - venn_diagram.png\n")
} else {
  cat("  警告: 有效cluster不足2个，跳过Venn图\n")
}

# ============================================================
# 5. 聚类热图 (top marker基因 × cluster)
# ============================================================
cat("\n[5/5] 聚类热图...\n")

# 每个cluster取top5 marker
top5_heat <- markers_all %>%
  group_by(cluster) %>%
  slice_max(order_by = avg_log2FC, n = 5) %>%
  ungroup()
heat_genes <- unique(top5_heat$gene)

# 计算每个cluster的平均表达量
avg_exp <- AverageExpression(seurat_obj, features = heat_genes,
                             return.seurat = FALSE)$RNA

# 标准化到 z-score (按行)
mat <- as.matrix(avg_exp)
mat_z <- t(scale(t(mat)))
mat_z[is.nan(mat_z)] <- 0
mat_z <- pmin(pmax(mat_z, -2.5), 2.5)  # clip

# 颜色
col_breaks <- seq(-2.5, 2.5, length.out = 101)
col_pal <- colorRampPalette(c("#4DBBD5", "white", "#E64B35"))(100)

# cluster颜色条
n_cl <- ncol(mat_z)
cl_col <- setNames(
  colorRampPalette(brewer.pal(min(n_cl, 12), "Set3"))(n_cl),
  colnames(mat_z)
)
ann_col <- data.frame(Cluster = colnames(mat_z), row.names = colnames(mat_z))

png(file.path(outdir, "heatmap_clusters.png"),
    width = max(800, n_cl * 60 + 300),
    height = max(900, length(heat_genes) * 18 + 200),
    res = 150)
pheatmap(mat_z,
         color = col_pal,
         breaks = col_breaks,
         cluster_rows = TRUE,
         cluster_cols = FALSE,
         show_rownames = TRUE,
         show_colnames = TRUE,
         fontsize_row = 7,
         fontsize_col = 10,
         border_color = NA,
         main = "Cluster Top5 Marker基因 Z-score热图",
         annotation_col = ann_col,
         annotation_colors = list(Cluster = cl_col))
dev.off()
cat("  - heatmap_clusters.png\n")

# ============================================================
# 完成
# ============================================================
cat("\n\n")
cat("所有图表已生成:\n")
cat("  DEG_dotplot.png - 差异表达DotPlot\n")
cat("  DEG_all_markers.csv - 差异表达结果表\n")
cat("  volcano_plots.png - 火山图\n")
cat("  GO_barplot.png - GO富集柱状图\n")
cat("  GO_dotplot.png - GO富集点图\n")
cat("  venn_diagram.png - Venn图\n")
cat("  heatmap_clusters.png - 聚类热图\n")
cat("\n")

不出3分钟，所有的图都生成好了，如下图列表。

三、查看结果

篇幅有限，此处只列举部分数据分析图像：

1. heatmap_clusters图
2. GO图
3. Venn图
4. DEG_dotplot图

惊呆了……这个顶刊莫兰迪配色也是被新的 Claude Opus 4.7 模型给学习到了……对比之前的 Claude 4.6 生成的灰色图片（如下），上面这些彩色生信分析图，实话讲，确实会给投递顶刊的文章加不少分。

四、图形解读

最后，我们再让百沐一下对以上生成的生信分析图（以 heatmap 为例）进行解读。百沐一下还给出了适合放在SCI里的图注的解析建议，直接采纳学习：

Heatmap showing the top five marker genes for each cluster. Colors represent row-scaled expression levels (Z-score), with red indicating high expression and blue indicating low expression. Distinct cluster-specific transcriptional signatures support the identification of epithelial, stromal, antigen-presenting, mast cell, and melanocyte-like populations.

最后总结

研究生读得好，工具少不了。Claude Opus 4.7 模型用在科研场景进行深度实测后，小编的第一反应是：科研效率的天花板再一次拉高了。新模型更多的学习和探索，从理论到实践，还得看今后大家在各个科研工作场景中的运用。懂科研，更要懂如何使用工具。进步来自于对一个个新工具的学习和运用。所以关注百沐一下，不止是 Claude Opus 4.7，期待与您一起在未来探索更多模型的学术实战上限。

浏览器搜索“百沐一下AI科研助理平台”，或者微信搜索“百沐一下”小程序，更多体验等待您的探索。

最新的Claude-opus-4-7在科研场景到底有多强...

最新文章

保姆级教程：在Ubuntu 18.04 + ROS Melodic上，用LeGO-LOAM跑通KITTI和速腾RS-16数据集

中小学信息技术，选择排序案例讲解

利用vrtk3.3 设计拉弓射箭效果

FlowState Lab 生成高质量合成时序数据，破解数据稀缺难题

从一次Jenkins安装报错，聊聊APT沙盒安全机制与日常运维的微妙冲突

MT5在内容去重降重的应用：批量生成同义句，提升文章原创度

推荐文章

CrossMgrLapCounter：嵌入式设备接入赛事计时系统的WebSocket协议库

Java Iterator

Mac上Xcode搞C++竞赛？手把手教你添加万能头文件stdc++.h（附完整代码）

利用BurpSuite Intruder模块实现验证码失效场景下的表单暴力破解

机器学习中的常用算法（非传统算法）

深度学习检测不准确智能电表:一个案例研究 python源代码，代码按照高水平文章复现

相关文章

科研绘图不止Origin：聊聊OriginPro 2021与Python/Matlab的共存与选择

StructBERT在客服系统中的实战应用：智能情绪分析与工单分类

30元玩客云变身全能软路由：手把手教你用Docker部署AllinOne直播服务

FinalBurn Neo终极指南：开源街机模拟器的技术架构与实战应用

OpCore-Simplify终极指南：10分钟完成黑苹果配置的完整解决方案

Qwen3.5-9B成本优化实践：Spot实例调度+自动启停+GPU资源弹性伸缩

分享文章

更多文章

Pixel Epic · Wisdom Terminal 物联网（IoT）后端开发：处理海量传感器数据的智能分析平台

雷达PD处理中的‘相参积累’到底强在哪？一个MATLAB仿真对比实验说清楚

你以为只是“换个顺序遍历”？二叉树垂直遍历，90%的人都写错了

一物一码有哪些公司：快消企业如何选择合适服务商

谁有GdiView工具呀

Playwright Python 自动化测试：零基础半个月的学习与踩坑记录

共探智能医疗与人工智能的新时代 | IHAI 2026

不锈钢彩涂板哪家信誉好

【硬件】2026最适合做家用NAS的CPU是哪一款

Gemini API 调用--提速100倍终极指南

洛谷 P1381 单词背诵

常见网络攻击