# 随机森林多分类模型 # packages 安装 —— install.packages("") setwd("D:/Rpackages") # packages 载入 —— library() library(randomForest) library(tidyverse) library(skimr) library(DataExplorer) library(caret) library(pROC) library(ggplot2) library(splines) library(reshape2) library(scales) library(ggprism) library(ggpubr) # 加载数据 boston <- read.csv(file.choose()) # 数据框转换 boston <- as.data.frame(boston) # boston <- na.pass(boston) # boston <- na.omit(boston) # na.action = na.omit 返回删除所有包含NA值的行的数据框或矩阵 # na.action = na.pass 将NA值传递给后续的计算，可能会导致结果中也出现NA # 查看数据概貌 skim(boston) # 查看数据缺失情况 plot_missing(boston) boston[is.na(boston)] <- 0 #将matrix（此处为boston）中的NA值替换为0，按需运行 # 数据类型修正，将boston中的i列转为factor，i 将依次取c()中的值 for (i in c(1:2)) { boston[,i] <- factor(boston[,i]) } # 因变量分布情况 table(boston$Class) # 拆分数据 set.seed(1) trains <- createDataPartition( y = boston$Class, p = 0.7, list = F ) traindata <- boston[trains,] testdata <- boston[-trains,] # # test：自选训练集测试集（无特殊可不理 # traindata <- read.csv(file.choose()) # traindata <- as.data.frame(traindata) # for (i in c(1:5)) { # traindata[,i] <- factor(traindata[,i]) # } # # testdata <- read.csv(file.choose()) # testdata <- as.data.frame(testdata) # for (i in c(1:5)) { # testdata[,i] <- factor(testdata[,i]) # } # 拆分后因变量分布 table(traindata$Class) table(testdata$Class) dim(boston) # # 构建公式，自变量列名~a到b列（colnames[a:b]） # # colnames(boston) 用于获取数据框的列名， # form_clsm <- as.formula( # paste0( # "class~", # paste(colnames(traindata)[3:112],collapse = "+") # ) # ) # form_clsm # # # 构建模型 # set.seed(100001) # fit_rf_clsm <- randomForest( # form_clsm, # data = traindata, # ntree = 500, # 默认500，error & trees不稳定需增加树的数量 # mtry = 6, # 每个节点可提供选择的变量数目（指定节点中用于二叉树的变量个数 # # 默认情况下数据集变量个数的二次方根(分类模型)或三分之一(预测模型)） # importance = T # importance = TRUE: 启用特征重要性计算 # # 随机森林会根据每个特征对模型性能的影响，计算出每个特征的重要性 # ) # print(fit_rf_clsm) # 定义训练集特征和目标变量 X_train <- traindata[, -(1:2)] #traindata中除第1、2列外的列为自变量 x y_train <- as.factor(traindata[, 2]) #traindata中第2列为因变量 y # # 创建随机森林分类模型（基准模型 # model <- randomForest(x = X_train, y = y_train, ntree = 500) # # # 创建训练控制对象 # ctrl <- trainControl(method = "repeatedcv", number = 5, repeats = 10) # # k 折交叉验证作为模型评估方法,小数据做重复10次5折交叉验证 # # # 进行参数调优 # # mtry参数调节 # grid1 <- expand.grid(mtry = c(48:52)) # 定义mtry范围 # # grid1 <- expand.grid(mtry = c(10, 20, 30, 40, 50, 60, 70, 80, 90, 100)) # # 进阶 # # num_features <- ncol(X_train) # # mtry_range <- floor(sqrt(num_features)) # 取平方根并向下取整 # # grid_mtry <- expand.grid(mtry = seq(max(2, mtry_range - 5), # # min(mtry_range + 5, num_features))) # # # 使用caret包进行调参 # rf_model <- train(x = X_train, y = y_train, # 自变量 x，因变量 y # method = "rf", # 使用的模型方法为随机森林（rf） # trControl = ctrl, # tuneGrid = grid1,) # # 输出结果 # print(rf_model) # # # # 定义最佳mtry参数 # grid2 <- expand.grid(mtry = c(30)) # # # 定义模型列表，存储每一个模型评估结果 # modellist <- list() # # 调整的参数是决策树的数量 # for (ntree in seq(100, 2000, by=100)) { # seq函数构建一个集合，间距by = 100 # set.seed(101) # fit <- train(x = X_train, y = y_train, method="rf", # metric="Accuracy", tuneGrid=grid2, # trControl=ctrl, ntree=ntree) # key <- toString(ntree) # modellist[[key]] <- fit # } # # # compare results # results <- resamples(modellist) # # # 输出最佳模型和参数 # summary(results) # # # 可视化模型性能，accuracy越近1越好，kappa越近1越好 # bwplot(results) # 箱线图 # dotplot(results) # 点图 # densityplot(results) # 密度图 # 使用最佳参数训练模型 set.seed(1001) fit_rf_clsm <- randomForest(x = X_train, y = y_train, mtry = 50, ntree = 500, importance = T) print(fit_rf_clsm) # ntree参数与error之间的关系图示 plot(fit_rf_clsm,main = "ERROR & TREES") legend("top", legend = colnames(fit_rf_clsm$err.rate), lty = 1:6, col = 1:6, horiz = T, cex = 0.9) plot(randomForest::margin(fit_rf_clsm), main = '观测值被判断正确的概率图') # 变量重要性 varImpPlot(fit_rf_clsm,main ="varImpPlot") varImpPlot(fit_rf_clsm,main = "varImpPlot",type = 1) varImpPlot(fit_rf_clsm,main = "varImpPlot",type = 2) importance_genus <- data.frame(importance(fit_rf_clsm)) importance_genus <- importance_genus[order(importance_genus$MeanDecreaseGini, decreasing=TRUE),] importance_genus <- importance_genus[order(importance_genus$MeanDecreaseAccuracy, decreasing=TRUE),] head(importance_genus) write.table(importance_genus,"importance_genus_DaChuang_SiteClass_unexposed20250209.txt", sep = '\t',col.names = NA,quote = FALSE) # 保存重要特征到文件 # # 预测 # # 训练集预测概率 # trainpredprob <- predict(fit_rf_clsm,newdata = traindata,type = "prob") # # 训练集ROC # multiclass.roc(response = traindata$class,predictor = trainpredprob) # # 训练集预测分类 # trainpredlab <- predict(fit_rf_clsm,newdata = traindata,type = "Class") # # 训练集混淆矩阵 # confusionMatrix_train <- confusionMatrix(data = trainpredlab, # reference = traindata$Class, # mode = "everything") # # 训练集综合结果 # multiClassSummary( # data.frame(obs = traindata$Class,pred=trainpredlab), # lev = levels(traindata$Class) # ) # # # # 作图展示 top N 重要的 OTUs # varImpPlot(fit_rf_clsm, n.var = min(20, nrow(fit_rf_clsm$importance)), # main = 'Top 20 - variable importance') # # # 测试集预测概率 # # X_test <- testdata[, -(1:2)] #testdata中除第1、2列外的列为自变量 x # # y_test <- as.factor(testdata[, 2]) #testdata中第2列为因变量 y # testpredprob <- predict(fit_rf_clsm,newdata = testdata,type = "prob") # # 测试集ROC # multiclass.roc(response = testdata$Class,predictor = testpredprob) # # 测试集预测分类 # testpredlab <- predict(fit_rf_clsm,newdata = testdata,type = "Class") # # 测试集混淆矩阵 # confusionMatrix_test <- confusionMatrix(data = testpredlab, # reference = testdata$Class, # mode = "everything") # confusionMatrix_test # # 测试集综合结果 # multiClassSummary( # data.frame(obs = testdata$Class,pred=testpredlab), # lev = levels(testdata$Class) # ) # 交叉验证帮助选择特定数量的特征 # 5次重复十折交叉验证 set.seed(10001) otu_train.cv <- replicate(5, rfcv(traindata[,-(1:2)], # 除去第a到b列(a:b) traindata$Class, cv.fold = 10, step = 1.5), simplify = FALSE) otu_train.cv <- data.frame(sapply(otu_train.cv, '[[', 'error.cv')) otu_train.cv$otus <- rownames(otu_train.cv) otu_train.cv <- reshape2::melt(otu_train.cv, id = 'otus') otu_train.cv$otus <- as.numeric(as.character(otu_train.cv$otus)) otu_train.cv.mean <- aggregate(otu_train.cv$value, by = list(otu_train.cv$otus), FUN = mean) head(otu_train.cv.mean, 18) # 绘图观察拐点 p <- ggplot(otu_train.cv,aes(otus,value)) + geom_smooth(se = FALSE, method = 'glm',formula = y~ns(x,6)) + theme(panel.grid = element_blank(), panel.background = element_rect(color = 'black',fill = 'transparent')) + labs(title = '',x='Number of genus',y='Cross-validation error') p # 在横坐标(xintecept)绘制竖线 p + geom_vline(xintercept = 160) # # 备用 # p2 <- ggplot(otu_train.cv,aes(otus,value)) + # geom_line() + # theme(panel.grid = element_blank(), # panel.background = element_rect(color = 'black', fill = 'transparent')) + # labs(title = '',x = 'Number of OTUs', y = 'Cross-validation error') # p2 # # p2 + geom_vline(xintercept = 30) # 大约提取前 N个重要的特征 importance_genus[1:160,] # importance_Ngenus <- importance_genus[1:160,] # # 输出表格 # write.table(importance_genus[1:70, ], # 'importance_genus_top70_of_zhangxiaofeng_human_drowning.txt', # sep = '\t', col.names = NA, quote = FALSE) # # 变量重要性 # varImpPlot(fit_rf_clsm,main ="varImpPlot") # varImpPlot(fit_rf_clsm,main = "varImpPlot",type = 1) # varImpPlot(fit_rf_clsm,main = "varImpPlot",type = 2) # # varImpPlot(fit_rf_clsm, n.var = min(160, nrow(fit_rf_clsm$importance)), # min(num,)处的num为图中的菌属数量 # main = 'Top 19 - variable importance',type = 1) # 简约分类器(只取部分高影响的自变量) # 选择 top N 重要的 OTUs，例如上述已经根据“Mean Decrease Accuracy”排名获得 genus_select <- rownames(importance_genus)[1:160] # 数据子集的训练集和测试集 genus_train_top <- traindata[ ,c(genus_select, 'Class')] genus_test_top<- testdata[ ,c(genus_select, 'Class')] # set.seed(10001) # form_clsm1 <- as.formula( # paste0( # "class~", # paste(colnames(genus_train_top)[1:10],collapse = "+") # ) # ) # 构建模型 # fit_rf_clsm1 <- randomForest( # form_clsm1, # data = genus_train_top, # ntree = 500, # mtry = 6, # importance = T # ) x_train1 <- genus_train_top[, -160 - 1] # 自变量 x y_train1 <- as.factor(genus_train_top[, 160 + 1]) # 因变量 y # fit_rf_clsm_test1 <- randomForest(x = x_train1, # y = y_train1, # ntree = 500, # 增加树的数量以提高稳定性 # importance = TRUE # 启用特征重要性计算 # ) # # fit_rf_clsm_test1 # # # 5 折交叉验证，重复 10 次 # ctrl1 <- trainControl(method = "repeatedcv", number = 5, repeats = 10) # # # 定义 mtry 和 ntree 的参数范围 # grid3 <- expand.grid(mtry = c(2:15)) # 定义mtry范围 # # # 进阶 # # num_features <- ncol(X_train) # # mtry_range <- floor(sqrt(num_features)) # 取平方根并向下取整 # # grid_mtry <- expand.grid(mtry = seq(max(2, mtry_range - 5), # # min(mtry_range + 5, num_features))) # # # 使用caret包进行调参 # fit_rf_clsm_test2 <- train(x = x_train1, y = y_train1, # 自变量 x，因变量 y # method = "rf", # 使用的模型方法为随机森林（rf） # trControl = ctrl1, # tuneGrid = grid3,) # # 输出结果 # print(fit_rf_clsm_test2) # # # 定义最佳mtry参数 # grid4 <- expand.grid(mtry = c(16)) # # # 定义模型列表，存储每一个模型评估结果 # modellist1 <- list() # # 调整的参数是决策树的数量 # for (ntree in seq(100, 2000, by=100)) { # seq函数构建一个集合，间距by = 100 # set.seed(100003) # fit1 <- train(x = x_train1, y = y_train1, method="rf", # metric="Accuracy", tuneGrid=grid4, # trControl=ctrl1, ntree=ntree) # key1 <- toString(ntree) # modellist1[[key1]] <- fit1 # } # # # compare results # results1 <- resamples(modellist1) # # # 输出最佳模型和参数 # summary(results1) # # # 可视化模型性能，accuracy越近进1越好，kappa越近1越好 # bwplot(results1) # 箱线图 # dotplot(results1) # 点图 # densityplot(results1) # 密度图 # 使用最佳参数训练模型 set.seed(1) fit_rf_clsm1 <- randomForest(x = x_train1, y = y_train1, mtry = 12, ntree = 500, importance = T) print(fit_rf_clsm1) # # "ERROR & TREES" # plot(fit_rf_clsm1,main = "ERROR & TREES") # # # plot(randomForest::margin(fit_rf_clsm1), main = '观测值被判断正确的概率图') # # 预测 # # 训练集预测概率 # trainpredprob <- predict(fit_rf_clsm1,newdata = genus_train_top,type = "prob") # # 训练集ROC # multiclass.roc(response = genus_train_top$Class,predictor = trainpredprob) # # 训练集预测分类 #trainpredlab <- predict(fit_rf_clsm1,newdata = genus_train_top,type = "Class") # # 训练集混淆矩阵 # confusionMatrix(data = trainpredlab, # reference = genus_train_top$Class, # mode = "everything") # 预测 # 测试集预测概率 # x_test1 <- genus_test_top[, -11] # 自变量 x # y_test1 <- as.factor(genus_test_top[, 11]) # 因变量 y testpredprob <- predict(fit_rf_clsm1,newdata = genus_test_top,type = "prob") write.table(testpredprob, file = "D:/Rpackages/testpredprob.txt", sep = "\t", row.names = FALSE, col.names = TRUE) # 测试集ROC multiclass.roc(response = genus_test_top$Class,predictor = testpredprob) # 测试集预测分类 testpredlab <- predict(fit_rf_clsm1,newdata = genus_test_top,type = "Class") # 测试集混淆矩阵 confusion_matrix <- confusionMatrix(data = testpredlab, reference = genus_test_top$Class, mode = "everything") # 测试集综合结果 multiClassSummary( data.frame(obs = genus_test_top$Class,pred=testpredlab), lev = levels(genus_test_top$Class) ) # 查看样本预测结果 results <- data.frame(Actual = genus_test_top$Class, Predicted = testpredlab) # 测试集预测分类 # testpredlab <- predict(fit_rf_clsm1,newdata = testdata,type = "class") # t <- table(testpredlab,testdata$class) # acc = sum(diag(t))/nrow(testdata)*100 # print(paste("模型准确率为：",round(acc,4),sep='')) # 绘制混淆矩阵热图(内容复杂，好汉谨慎处之) # confusion_matrix是混淆矩阵对象 # 转换混淆矩阵为数据框 roc1 <- multiclass.roc(response = genus_test_top$Class,predictor =testpredprob[,1:6]) roc1 <- multiclass.roc(response = genus_test_top$Class,predictor =testpredprob[,1]) plot(roc1$rocs[[1]],col="#1f77b4",print.auc = TRUE,print.auc.x=0.8,print.auc.y=0.8) roc2 <- multiclass.roc(response = genus_test_top$Class,predictor =testpredprob[,2]) plot(roc2$rocs[[1]],add=TRUE,col="#ff7f0e",print.auc = TRUE,print.auc.x=0.6,print.auc.y=0.6) roc3 <- multiclass.roc(response = genus_test_top$Class,predictor =testpredprob[,3]) plot(roc3$rocs[[1]],add=TRUE,col="#2ca02c",print.auc=TRUE,print.auc.x=0.5,print.auc.y=0.5) roc4 <- multiclass.roc(response = genus_test_top$Class,predictor =testpredprob[,4]) plot(roc4$rocs[[1]],add=TRUE,col="#d62728",print.auc=TRUE,print.auc.x=0.4,print.auc.y=0.4) roc5 <- multiclass.roc(response = genus_test_top$Class,predictor =testpredprob[,5]) plot(roc5$rocs[[1]],add=TRUE,col="#9467bd",print.auc=TRUE,print.auc.x=0.3,print.auc.y=0.3) roc6 <- multiclass.roc(response = genus_test_top$Class,predictor =testpredprob[,6]) plot(roc1$rocs[[6]], add = TRUE, col = "#8c564b", print.auc = TRUE, print.auc.x = 0.2, print.auc.y = 0.2) # confusion_matrix_df <- as.data.frame.matrix(confusion_matrix$table) # colnames(confusion_matrix_df) <- c("F","H") # rownames(confusion_matrix_df) <- c("F","H") # # #c("1", "2", "3", "4", "5", "6", "7", "8", "9", "10", "11", "12", "13", "14", "15") # colnames(confusion_matrix_df) <- c("01", "02", "03", "04", "05", "06", "07", "08", "09", "10", "11", "12", "13", "14", "15") # rownames(confusion_matrix_df) <- c("01", "02", "03", "04", "05", "06", "07", "08", "09", "10", "11", "12", "13", "14", "15") # # 计算归一化值 # draw_data <- round(confusion_matrix_df / colSums(confusion_matrix_df),2) # draw_data <- as.data.frame(t(draw_data)) #使用t()函数转换draw_data的行列，原本列为真实类别，现转为行 # draw_data$real <- rownames(draw_data) #提取行名作为新生成列real的类别 # draw_data <- melt(draw_data) #将宽格式的数据框转换为长格式 # # # 绘制矩阵热图 # confusion1 <- ggplot(draw_data, aes(real, variable, fill = value)) + # geom_tile() + # geom_text(aes(label = scales::percent(value))) + # scale_fill_gradient(low = "#F0F0F0", high = "#3575b5") + # labs(x = "Prediction", y = "Reference", title = "Confusion matrix") + # theme_prism(border = T) + # theme(panel.border = element_blank(), # axis.ticks.y = element_blank(), # axis.ticks.x = element_blank(), # legend.position="right", # plot.title = element_text(hjust = 0.5)) # # confusion1 # # 二分类ROC曲线绘制 # # 计算ROC曲线的参数 # roc_obj <- roc(response = genus_test_top$class, predictor = testpredprob[, 2]) # roc_auc <- auc(roc_obj) # # 将ROC对象转换为数据框 # roc_data <- data.frame(1 - roc_obj$specificities, roc_obj$sensitivities) # # 绘制ROC曲线 # ROC1 <- ggplot(roc_data, aes(x = 1 - roc_obj$specificities, y = roc_obj$sensitivities)) + # geom_line(color = "#0073C2FF", size = 1) + # annotate("segment", x = 0, y = 0, xend = 1, yend = 1, linetype = "dashed", color = "gray") + # annotate("text", x = 0.8, y = 0.2, label = paste("AUC =", round(roc_auc, 3)), size = 4, color = "black") + # coord_cartesian(xlim = c(0, 1), ylim = c(0, 1)) + # theme_pubr() + # labs(x = "1 - Specificity", y = "Sensitivity") + # ggtitle("ROC Curve") + # theme(plot.title = element_text(size = 14, face = "bold")) + # theme_prism(border = T) # ROC1 # # # 计算 ROC 和 AUC # roc_obj <- roc(response = genus_test_top$class, predictor = testpredprob[, 2]) # roc_auc <- auc(roc_obj) # # # 将 ROC 对象转换为数据框 # roc_data <- data.frame( # FPR = 1 - roc_obj$specificities, # TPR = roc_obj$sensitivities # ) # # # 平滑处理 # smooth_roc <- data.frame( # FPR = spline(roc_data$FPR, n = 500)$x, # TPR = spline(roc_data$TPR, n = 500)$y # ) # # # 绘制平滑后的 ROC 曲线 # ROC1 <- ggplot(smooth_roc, aes(x = FPR, y = TPR)) + # geom_line(color = "#0073C2FF", size = 1) + # annotate("segment", x = 0, y = 0, xend = 1, yend = 1, linetype = "dashed", color = "gray") + # annotate("text", x = 0.8, y = 0.2, label = paste("AUC =", round(roc_auc, 2)), size = 4, color = "black") + # coord_cartesian(xlim = c(0, 1), ylim = c(0, 1)) + # theme_pubr() + # labs(x = "1 - Specificity", y = "Sensitivity") + # ggtitle("Smoothed ROC Curve") + # theme(plot.title = element_text(size = 14, face = "bold")) + # theme_prism(border = T) # # ROC1 # # geom_smooth(se = FALSE, method = 'glm',formula = y~ns(x,6)) # # # 保存模型 # saveRDS(fit_rf_clsm, # file = "D:/Documents/R.data/fit_rf_clsm1_UnSimplifiedSiteClass_ConcernGender_UnexposedTop19_240209.rds") # # # 读取模型 # fit_rf_clsm1 <- readRDS("D:/Documents/R.data/fit_rf_clsm1_hand_Simplified_240102.rds") # # # 读取待分类数据 # testdata1 <- read.csv(file.choose()) # testdata1 <- as.data.frame(testdata) # for (i in c(1:2)) { # testdata1[,i] <- factor(testdata1[,i]) # } # # # 应用 # # 待分类数据集预测概率 # testpredprob <- predict(fit_rf_clsm1, newdata = testdata1, type = "prob") # # 测试集ROC # multiclass.roc(response = testdata1$class, predictor = testpredprob) # # 待分类数据集预测分类 # testpredlab <- predict(fit_rf_clsm1, newdata = testdata1,type = "class") # # 待分类数据集混淆矩阵 # confusion_matrix <- confusionMatrix(data = testpredlab, # reference = testdata1$class, # mode = "everything") # # 待分类数据集综合结果 # multiClassSummary( # data.frame(obs = testdata1$class,pred=testpredlab), # lev = levels(testdata1$class) # ) # # # 查看样本分类结果 # results <- data.frame(Actual = testdata1$class, Predicted = testpredlab) （这是整个的代码，testpredprob <- predict(fit_rf_clsm1,newdata = genus_test_top[1:5, ],type = "prob")，跑不下来）

install.packages("os") WARNING: Rtools is required to build R packages but is not currently installed. Please download and install the appropriate version of Rtools before proceeding: https://cran.rstudio.com/bin/windows/Rtools/ Warning in install.packages : package ‘os’ is not available for this version of R A version of this package for your version of R might be available elsewhere, see the ideas at https://cran.r-project.org/doc/manuals/r-patched/R-admin.html#Installing-packages

好的，用户遇到了在R中安装名为“os”的包的问题，错误提示说这个包不可用，还建议安装Rtools。首先，我需要确认用户的需求是什么。用户可能是在R中尝试安装一个不存在的包，或者可能打错了包的名字。接下来，我需要...

library(metricsets) Error in library(package, pos = pos, lib.loc = lib.loc, character.only = TRUE, : 不存在叫‘metricsets’这个名字的程辑包 > install.packages("metricsets") WARNING: Rtools is required to build R packages but is not currently installed. Please download and install the appropriate version of Rtools before proceeding: https://cran.rstudio.com/bin/windows/Rtools/ 将程序包安装入‘C:/Users/啊/AppData/Local/R/win-library/4.2’ (因为‘lib’没有被指定) Warning in install.packages : package ‘metricsets’ is not available for this version of R A version of this package for your version of R might be available elsewhere, see the ideas at https://cran.r-project.org/doc/manuals/r-patched/R-admin.html#Installing-packages > library(metricsets) Error in library(package, pos = pos, lib.loc = lib.loc, character.only = TRUE, : 不存在叫‘metricsets’这个名字的程辑包

根据你提供的信息，可以看出 metricsets 包可能尚未在 ...install.packages("devtools") 4. 安装完成后，使用以下命令加载该包： R library(metricsets) 这样，你就可以使用 metricsets() 函数了。

> #安装包包 > reticulate::py_install("path/to/kaleido-0.1.0-py2.py3-none-any.whl", pip = TRUE) Using virtual environment "C:/Users/HanRan/r-reticulate-venv" ... + "C:/Users/HanRan/r-reticulate-venv/Scripts/python.exe" -m pip install --upgrade --no-user path/to/kaleido-0.1.0-py2.py3-none-any.whl WARNING: Requirement 'path/to/kaleido-0.1.0-py2.py3-none-any.whl' looks like a filename, but the file does not exist Processing c:\rwork\path\to\kaleido-0.1.0-py2.py3-none-any.whl ERROR: Could not install packages due to an OSError: [Errno 2] No such file or directory: 'C:\\Rwork\\path\\to\\kaleido-0.1.0-py2.py3-none-any.whl' 错误: Error installing package(s): "path/to/kaleido-0.1.0-py2.py3-none-any.whl"

我们正在解决用户在使用 reticulate::py_install() 安装本地 WHL 文件时遇到的路径错误问题。用户提供的命令是： reticulate::py_install("path/to/kaleido-0.1.0-py2.py3-none-any.whl", pip = TRUE) 但出现了...

> Glycosites <- read.csv("D:/SCLC组学/糖基化/Glycosites.csv") > View(Glycosites) > NGT <- read.csv("D:/SCLC组学/糖基化/NGT.csv") > View(NGT) > View(Glycosites) > View(NGT) > View(Glycosites) > View(NGT) > View(Glycosites) > setwd("D:/SCLC组学/糖基化") > library(tidyverse) > > library(psych) > > library(pheatmap) > > library(qvalue) 错误于library(qvalue): 不存在叫‘qvalue’这个名称的程序包 > BiocManager::install("qvalue") 'getOption("repos")' replaces Bioconductor standard repositories, see 'help("repositories", package = "BiocManager")' for details. Replacement repositories: CRAN: https://mirrors.tuna.tsinghua.edu.cn/CRAN/ Bioconductor version 3.21 (BiocManager 1.30.25), R 4.5.0 (2025-04-11 ucrt) Installing package(s) 'qvalue' 试开URL’https://bioconductor.org/packages/3.21/bioc/bin/windows/contrib/4.5/qvalue_2.40.0.zip' Content type 'application/zip' length 2810649 bytes (2.7 MB) downloaded 2.7 MB 程序包‘qvalue’打开成功，MD5和检查也通过下载的二进制程序包在 C:\Users\lenovo\AppData\Local\Temp\RtmpIl7yPX\downloaded_packages里 Old packages: 'annotate', 'BiocManager', 'BiocParallel', 'commonmark', 'ComplexHeatmap', 'cowplot', 'curl', 'data.table', 'dendextend', 'Deriv', 'doBy', 'DropletUtils', 'edgeR', 'emmeans', 'evaluate', 'fitdistrplus', 'future', 'future.apply', 'ggforce', 'ggpubr', 'gh', 'h5mread', 'haven', 'httr2', 'KEGGREST', 'limma', 'maps', 'openssl', 'parallelly', 'patchwork', 'pheatmap', 'pillar', 'pkgbuild', 'pkgdown', 'plotly', 'promises', 'purrr', 'Rcpp', 'RcppArmadillo', 'restfulr', 'rhdf5', 'rprojroot', 'RSQLite', 'S4Arrays', 'shiny', 'spatstat.explore', 'spatstat.geom', 'spatstat.random', 'spatstat.univar', 'spatstat.utils', 'statnet.common', 'tensor', 'tibble', 'utf8', 'waldo', 'xgboost', 'zip', 'lattice', 'mgcv' Update all/some/none? [a/s/n]: n > library(qvalue) > > Glycosites <- Glycosites[, colnames(NGT)] 错误于[.data.frame(Glycosites, , colnames(NGT)): 选择了未定义的列 > Glycosites <- Glycosites[, colnames(NGT)] 错误于[.data.frame(Glycosites, , colnames(NGT)): 选择了未定义的列 > View(NGT) > colnames(Glycosites)[1] <- "Gene.Name" > Glycosites <- Glycosites[, colnames(NGT)] > > results <- data.frame( + Gene = rownames(NGT), + Rho = numeric(nrow(NGT)), + P_value = numeric(nrow(NGT)), + Q_value = numeric(nrow(NGT)) + ) > for(i in 1:nrow(NGT)) { + gene <- rownames(NGT)[i] + + # 仅当两个表中都存在该基因时才计算 + if(gene %in% rownames(Glycosites)) { + cor_test <- cor.test( + x = NGT[gene, ], + y = Glycosites[gene, ], + method = "spearman", + exact = FALSE # 精确计算在大样本中较慢 + ) + + results[i, "Rho"] <- cor_test$ estimate + results[i, "P_value"] <- cor_test$ p.value + } + } 错误于cor.test.default(x = NGT[gene, ], y = Glycosites[gene, ], method = "spearman", : 'x'必需是数值向量 > library(WGCNA) 错误于library(WGCNA): 不存在叫‘WGCNA’这个名称的程序包 > BiocManager::install("WGCNA") 'getOption("repos")' replaces Bioconductor standard repositories, see 'help("repositories", package = "BiocManager")' for details. Replacement repositories: CRAN: https://mirrors.tuna.tsinghua.edu.cn/CRAN/ Bioconductor version 3.21 (BiocManager 1.30.25), R 4.5.0 (2025-04-11 ucrt) Installing package(s) 'WGCNA' 还安装依赖关系‘htmlTable’, ‘dynamicTreeCut’, ‘Hmisc’, ‘preprocessCore’, ‘GO.db’ 试开URL’https://mirrors.tuna.tsinghua.edu.cn/CRAN/bin/windows/contrib/4.5/htmlTable_2.4.3.zip' 试开URL’https://mirrors.tuna.tsinghua.edu.cn/CRAN/bin/windows/contrib/4.5/dynamicTreeCut_1.63-1.zip' 试开URL’https://mirrors.tuna.tsinghua.edu.cn/CRAN/bin/windows/contrib/4.5/Hmisc_5.2-3.zip' 试开URL’https://bioconductor.org/packages/3.21/bioc/bin/windows/contrib/4.5/preprocessCore_1.70.0.zip' 试开URL’https://mirrors.tuna.tsinghua.edu.cn/CRAN/bin/windows/contrib/4.5/WGCNA_1.73.zip' download.packages(pkgs, destdir = tmpd, available = available, 里有警告: 下载程序包‘Hmisc’时出了问题 download.packages(pkgs, destdir = tmpd, available = available, 里有警告: 下载程序包‘WGCNA’时出了问题程序包‘htmlTable’打开成功，MD5和检查也通过程序包‘dynamicTreeCut’打开成功，MD5和检查也通过程序包‘preprocessCore’打开成功，MD5和检查也通过下载的二进制程序包在 C:\Users\lenovo\AppData\Local\Temp\RtmpIl7yPX\downloaded_packages里安装源码包‘GO.db’ 试开URL’https://bioconductor.org/packages/3.21/data/annotation/src/contrib/GO.db_3.21.0.tar.gz' Content type 'application/x-gzip' length 25563907 bytes (24.4 MB) downloaded 24.4 MB * installing source package 'GO.db' ... this is package 'GO.db' version '3.21.0' using staged installation R inst byte-compile and prepare package for lazy loading help * installing help indices building package indices testing if installed package can be loaded from temporary location testing if installed package can be loaded from final location ** testing if installed package keeps a record of temporary installation path * DONE (GO.db) 下载的程序包在 ‘C:\Users\lenovo\AppData\Local\Temp\RtmpIl7yPX\downloaded_packages’里 Old packages: 'annotate', 'BiocManager', 'BiocParallel', 'commonmark', 'ComplexHeatmap', 'cowplot', 'curl', 'data.table', 'dendextend', 'Deriv', 'doBy', 'DropletUtils', 'edgeR', 'emmeans', 'evaluate', 'fitdistrplus', 'future', 'future.apply', 'ggforce', 'ggpubr', 'gh', 'h5mread', 'haven', 'httr2', 'KEGGREST', 'limma', 'maps', 'openssl', 'parallelly', 'patchwork', 'pheatmap', 'pillar', 'pkgbuild', 'pkgdown', 'plotly', 'promises', 'purrr', 'Rcpp', 'RcppArmadillo', 'restfulr', 'rhdf5', 'rprojroot', 'RSQLite', 'S4Arrays', 'shiny', 'spatstat.explore', 'spatstat.geom', 'spatstat.random', 'spatstat.univar', 'spatstat.utils', 'statnet.common', 'tensor', 'tibble', 'utf8', 'waldo', 'xgboost', 'zip', 'lattice', 'mgcv' Update all/some/none? [a/s/n]: n 警告信息: 1: In download.file(urls, destfiles, "libcurl", mode = "wb", ...) : URL 'https://mirrors.tuna.tsinghua.edu.cn/CRAN/bin/windows/contrib/4.5/Hmisc_5.2-3.zip': status was 'Failure when receiving data from the peer' 2: In download.file(urls, destfiles, "libcurl", mode = "wb", ...) : URL 'https://mirrors.tuna.tsinghua.edu.cn/CRAN/bin/windows/contrib/4.5/WGCNA_1.73.zip': status was 'Failed sending data to the peer' 3: In download.file(urls, destfiles, "libcurl", mode = "wb", ...) : some files were not downloaded > library(WGCNA) 错误于library(WGCNA): 不存在叫‘WGCNA’这个名称的程序包 > BiocManager::install("WGCNA") 'getOption("repos")' replaces Bioconductor standard repositories, see 'help("repositories", package = "BiocManager")' for details. Replacement repositories: CRAN: https://mirrors.tuna.tsinghua.edu.cn/CRAN/ Bioconductor version 3.21 (BiocManager 1.30.25), R 4.5.0 (2025-04-11 ucrt) Installing package(s) 'WGCNA' 还安装依赖关系‘Hmisc’ 试开URL’https://mirrors.tuna.tsinghua.edu.cn/CRAN/bin/windows/contrib/4.5/Hmisc_5.2-3.zip' 试开URL’https://mirrors.tuna.tsinghua.edu.cn/CRAN/bin/windows/contrib/4.5/WGCNA_1.73.zip' 程序包‘Hmisc’打开成功，MD5和检查也通过程序包‘WGCNA’打开成功，MD5和检查也通过下载的二进制程序包在 C:\Users\lenovo\AppData\Local\Temp\RtmpIl7yPX\downloaded_packages里 Old packages: 'annotate', 'BiocManager', 'BiocParallel', 'commonmark', 'ComplexHeatmap', 'cowplot', 'curl', 'data.table', 'dendextend', 'Deriv', 'doBy', 'DropletUtils', 'edgeR', 'emmeans', 'evaluate', 'fitdistrplus', 'future', 'future.apply', 'ggforce', 'ggpubr', 'gh', 'h5mread', 'haven', 'httr2', 'KEGGREST', 'limma', 'maps', 'openssl', 'parallelly', 'patchwork', 'pheatmap', 'pillar', 'pkgbuild', 'pkgdown', 'plotly', 'promises', 'purrr', 'Rcpp', 'RcppArmadillo', 'restfulr', 'rhdf5', 'rprojroot', 'RSQLite', 'S4Arrays', 'shiny', 'spatstat.explore', 'spatstat.geom', 'spatstat.random', 'spatstat.univar', 'spatstat.utils', 'statnet.common', 'tensor', 'tibble', 'utf8', 'waldo', 'xgboost', 'zip', 'lattice', 'mgcv' Update all/some/none? [a/s/n]: n > library(WGCNA) 载入需要的程序包：dynamicTreeCut 载入需要的程序包：fastcluster 载入程序包：‘fastcluster’ The following object is masked from ‘package:stats’: hclust 载入程序包：‘WGCNA’ The following object is masked from ‘package:qvalue’: qvalue The following object is masked from ‘package:stats’: cor 警告信息: 程序包‘WGCNA’是用R版本4.5.1 来建造的 > > library(reshape2) 载入程序包：‘reshape2’ The following object is masked from ‘package:tidyr’: smiths > > library(pheatmap) > > if (!all(colnames(NGT) == colnames(Glycosites))) { + # 调整代谢组数据的列顺序与蛋白质组相同 + Glycosites <- Glycosites[, colnames(NGT)] + } > rm(results) > rm(gene) > rm(i) > NGT_t <- t(NGT) > View(NGT_t) > colnames(NGT_t) <- NGT[,1] > NGT_t <- NGT_t[,-1] > View(NGT) > View(NGT_t) > View(NGT) > View(NGT) > View(NGT_t) > rm(NGT_t) > NGT_t <- t(NGT) > > View(NGT_t) > colnames(NGT_t) <- NGT_t[,1] 错误于dimnames(x) <- dn: 'dimnames'的长度[2]必需与陈列范围相等 > colnames(NGT_t) <- NGT_t[1,] > NGT_t <- NGT_t[-1,] > > Glycosites <- t(Glycosites) # 代谢物 > > colnames(Glycosites) <- Glycosites[1,] > Glycosites <- Glycosites[-1,] > cor_res <- corAndPvalue(NGT_t, Glycosites, method = "spearman", use = "pairwise.complete.obs") 错误于stats::cor(x, y, use, method): 'x'必需为数值 > class(Glycosites) # 应返回"numeric"或"integer" [1] "matrix" "array" > > str(Glycosites) chr [1:9, 1:385] " 71.24190827" "2.448226e+00" " 3.404418298" "6.343631e+00" NA ... - attr(*, "dimnames")=List of 2 ..$ : chr [1:9] "B" "C" "D" "G" ... ..$ : chr [1:385] "CEACAM5_580" "CEACAM5_480" "IL4I1_134" "THBS2_1069" ... > Glycosites <- as.numeric(as.character(Glycosites)) > Glycosites <- read.csv("D:/SCLC组学/糖基化/Glycosites.csv", row.names=1) > View(Glycosites) > View(Glycosites) > View(NGT) > rownames(NGT) <- NGT[,1] > NGT <- NGT[,-1] > common_samples <- intersect(colnames(NGT), colnames(Glycosites)) > > prot_t <- t(NGT) > View(prot_t) > rm(NGT_t) > metab_t <- t(Glycosites) # 代谢组数据转置 > > corr_result <- Hmisc::rcorr( + as.matrix(prot_t), + as.matrix(metab_t), + type = "spearman" # Spearman相关性 + ) 警告信息: In sqrt(npair - 2) : 产生了NaNs > View(corr_result) > rho_matrix <- corr_result$ r[1:ncol(prot_t), (ncol(prot_t)+1):ncol(corr_result$ r)] > > pval_matrix <- corr_result$ P[1:ncol(prot_t), (ncol(prot_t)+1):ncol(corr_result$ P)] > > cor_df <- melt(rho_matrix, varnames = c("Gene", "Glycosites"), value.name = "Rho") > > pval_df <- melt(pval_matrix, varnames = c("Gene", "Glycosites"), value.name = "P_value") > > result_table <- cor_df %>% + left_join(pval_df, by = c("Gene", "Glycosites")) %>% + mutate( + FDR = p.adjust(P_value, method = "BH"), # BH法校正多重检验 + ) > ) 错误: 意外的')'在" )"里 > result_table <- cor_df %>% + left_join(pval_df, by = c("Gene", "Glycosites")) %>% + mutate( + FDR = p.adjust(P_value, method = "BH"), # BH法校正多重检验 + ) > View(result_table) > write.csv(result_table, "Protein_Glycosites_Correlation.csv", row.names = FALSE) > > sig_cor <- result_table %>% + filter(FDR < 0.05) > heatmap_data <- dcast(sig_cor, Gene ~ Metabolite, value.var = "Rho") 错误于FUN(X[[i]], ...): 找不到对象'Metabolite' > heatmap_data <- dcast(sig_cor, Gene ~ Glycosites, value.var = "Rho") > rownames(heatmap_data) <- heatmap_data$ Gene > > heatmap_data <- as.matrix(heatmap_data[, -1]) > > heatmap( + heatmap_data, + color = colorRampPalette(c("blue", "white", "red"))(50), + clustering_method = "complete", + show_rownames = TRUE, + show_colnames = TRUE, + scale = "none", + main = "Protein-Metabolite Significant Correlations (FDR < 0.05)", + fontsize_row = 8, + fontsize_col = 8 + ) 错误于hclustfun(distfun(x)): 外接函数调用时不能有NA/NaN/Inf(arg10) > pheatmap( + heatmap_data, + color = colorRampPalette(c("blue", "white", "red"))(50), + clustering_method = "complete", + show_rownames = TRUE, + show_colnames = TRUE, + scale = "none", + main = "Protein-Metabolite Significant Correlations (FDR < 0.05)", + fontsize_row = 8, + fontsize_col = 8 + ) 错误于hclust(d, method = method): 外接函数调用时不能有NA/NaN/Inf(arg10)

用户遇到了多个问题：程序包安装失败、数据结构错误、相关性计算错误以及热图绘制失败。我们将逐步解决这些问题。 ### 1. 程序包安装失败在R中安装包失败通常有几个原因： - 镜像源设置问题 - 依赖包未安装 - 网络...

######Video source: https://shop119322454.taobao.com #install.packages("survival") setwd("D:\\tcgagene\\survival") #工作目录（需修改） library(survival) rt=read.table("clinicalExp.txt",header=T,sep="\t",check.names=F) rt$futime=rt$futime/365 #如果以月为单位，除以30；以年为单位，除以365 outTab=data.frame() for(gene in colnames(rt[,4:ncol(rt)])){ a=rt[,gene]<median(rt[,gene]) diff=survdiff(Surv(futime, fustat) ~a,data = rt) pValue=1-pchisq(diff$chisq,df=1) outTab=rbind(outTab,cbind(gene=gene,pvalue=pValue)) #pValue=round(pValue,3) pValue=signif(pValue,4) pValue=format(pValue, scientific = TRUE) fit <- survfit(Surv(futime, fustat) ~ a, data = rt) summary(fit) tiff(file=paste(gene,".survival.tiff",sep=""), width = 14, #图片的宽度 height =14, #图片的高度 units ="cm", compression="lzw", bg="white", res=600) plot(fit, lwd=2, col=c("red","blue"), xlab="Time (month)", mark.time=T, ylab="Survival rate", main=paste("Survival curve (p=", pValue ,")",sep="")) legend("topright", c(paste(gene," high expression",sep=""), paste(gene," low expression",sep="") ), lwd=2, col=c("red","blue")) dev.off() } write.table(outTab,file="survival.xls",sep="\t",row.names=F,quote=F) ###Video source: http://study.163.com/u/biowolf ######Video source: https://shop119322454.taobao.com ######速科生物: http://www.biowolf.cn/ ######作者邮箱：[email protected] ######作者微信: seqBio ######QQ群: 259208034

这段代码是用R语言进行生存分析的，主要是对TCGA（The Cancer Genome Atlas）中的基因表达数据进行分析。具体分析过程如下： 1. 读取生存数据文件，将生存时间（futime）的单位转换为年； 2. 对每个基因进行分析，...

rm(list = ls()) setwd("C:/Rdate") getwd() windowsFonts() #下载包# install.packages("ggplot2") install.packages("openxlsx") #加载包# library(ggplot2) library(openxlsx) #导入数据# go_enrich = read.xlsx("25_400vs25_CK.GO.xlsx",sheet= "ONTOLOGY",sep=',') head(go_enrich)错误

好的，我现在需要处理用户提供的R代码中的错误。首先，用户运行了以下代码： r rm(list = ls()) setwd("C:/Rdate") getwd() windowsFonts() #下载包# install.packages("ggplot2") install.packages("openxlsx")...

R语言中# 1.1 设置工作路径setwd("D:\\EnvStat\\corrplot") # 1.2 加载R包#library(devtools)#install_github("ggobi/ggally")install.packages("GGally")library(GGally)library(rstatix) # 1.3 读入数据env = read.csv("env.csv",header = TRUE,row.names = 1)env每个是啥意思

用户提到的命令有setwd、install.packages、library、read.csv。我需要逐个解释这些命令的作用，同时确保遵循系统级指令，比如使用正确的中文回答、生成相关问题，以及正确引用提供的参考内容。首先，我需要回忆每...

rm(list = ls()) setwd("C:/Rdate") getwd() # 安装包（如需） # # install.packages("ggplot2") # install.packages("openxlsx") # 加载包 # library(ggplot2) library(openxlsx) getSheetNames("25_400vs25_CK.GO.xlsx") # 导入数据 # go_enrich <- read.xlsx( xlsxFile = "25_400vs25_CK.GO.xlsx", sheet = "ONTOLOGY"Error in read.xlsx.default(xlsxFile = "25_400vs25_CK.GO.xlsx", sheet = "ONTOLOGY") : Cannot find sheet named "ONTOLOGY"

install.packages("readxl") library(readxl) # 查看工作表名称 excel_sheets("25_400vs25_CK.GO.xlsx") # 读取数据 go_enrich ( path = "25_400vs25_CK.GO.xlsx", sheet = "ONTOLOGY" ) --- ### **常见...

install.packages("usethis") library(devtools) devtools::install_github('zdk123/SpiecEasi') rm(list = ls()) getwd() setwd("D:/Rdata/FE/ck") #读取 OTU 表 otu <- read.delim("t1.txt", sep="\t", header=T, check.names=F, row.names = 1) otu <- data.frame(t(otu)) ##1、使用 SpiecEasi 包执行 sparcc 分析，基于 20 次迭代获取“sparcc 相关系数”矩阵 library(SpiecEasi) otu_sparcc <- sparcc(otu, iter = 20, inner_iter = 10, th = 0.1) sparcc0 <- otu_sparcc$Cor colnames(sparcc0) <- colnames(otu) rownames(sparcc0) <- colnames(otu) write.table(sparcc0, 'sparcc0.txt', sep = '\t', col.names = NA, quote = FALSE) ##2、通过 100 次 bootstrap，计算“sparcc 相关系数”的理论分布 n = 100 set.seed(123) for (i in 1:n) { otu_boot <- sample(otu, replace = TRUE) otu_boot_sparcc <- sparcc(otu_boot, iter = 20, inner_iter = 10, th = 0.1) sparcc_boot <- otu_boot_sparcc$Cor colnames(sparcc_boot) <- colnames(otu_boot) rownames(sparcc_boot) <- colnames(otu_boot) write.table(sparcc_boot, paste('sparcc_boot', i, '.txt', sep = ''), sep = '\t', col.names = NA, quote = FALSE) } ##3、基于上述 100 次 bootstrap 的结果，获取“sparcc 相关系数”的伪 p 值 p <- sparcc0 p[p!=0] <- 0 for (i in 1:n) { p_boot <- read.delim(paste('sparcc_boot', i, '.txt', sep = ''), sep = '\t', row.names = 1) p[abs(p_boot)>=abs(sparcc0)] <- p[abs(p_boot)>=abs(sparcc0)] + 1 } p <- p / n write.table(p, '伪p值矩阵.txt', sep = '\t', col.names = NA, quote = FALSE) ##4、合并结果 #去除“sparcc 相关系数”中的自相关，并由于矩阵是对称的，只选择矩阵中的半三角（如下三角）区域的数值即可 diag(sparcc0) <- NA sparcc0[upper.tri(sparcc0)] <- NA #合并“sparcc 相关系数”以及显著性 p 值信息 library(reshape2) sparcc0 <- melt(sparcc0) p <- melt(p) sparcc0 <- cbind(sparcc0, p[3]) names(sparcc0) <- c('source', 'target', 'sparcc', 'p.value') sparcc0 <- na.omit(sparcc0) #输出边列表，这是所有 OTU 的相关性，我未加筛选，你可以后续再自己设定一个标准（相关系数、显著性阈值等）选择可信的值 write.table(sparcc0, 'sparcc_all.txt', sep = '\t', quote = FALSE, row.names = FALSE) #输出边列表，这是我按照 p<0.05 的标准选择的值 sparcc0_select <- subset(sparcc0, p.value < 0.05) write.table(sparcc0_select, 'sparcc_select(p小于0.05ck1).txt', sep = '\t', quote = FALSE, row.names = FALSE)我需要基于R语言和gephi软件进行微生物群落相关性网络可视化。我有以下数据1.丰度表C:/Users/Lenovo/Desktop/ZF/ZFasv.txt,2.分类信息表C:/Users/Lenovo/Desktop/ZF/ZFtax.txt，两个表格都是asv表。需要rstudio 用sparcc 的算法进行计算，生成能够用于gephi 绘图的边和点文件，生成的文件保存在C:/Users/Lenovo/Desktop/ZF文件夹内，请将我的上述需求和文件带入重新生成一个完整的代码

例如，如果SpiecEasi可以通过CRAN安装，可能需要使用install.packages，否则可能需要从GitHub安装。根据用户原来的代码，他们使用的是devtools::install_github('zdk123/SpiecEasi')，所以需要保留这部分。 - **...

错误于.io_check_exists(path(con)): file(s) do not exist: ‘G:/R-4.5.0/Rstudio/ieu-a-2.vcf/’

请检查路径：",file_path)}#尝试读取文件#如果是csvgeno_data<-read.csv(file_path,stringsAsFactors=FALSE)#如果是excel#需要先安装readxl包#install.packages("readxl")library(readxl)geno_data(file_path,sheet=...

getwd() setwd( "/Users/jasmma/abl") zxb=read.csv("zxb111.csv") log<-glm(frail~age+txl+BMI+ag+tx+BM+address+sex+marriage+live+smoking+drink+exercise+education+primary+DM+HP+Hrart +Cero+com+pro+income+follow+depress+anxiety+RBC+Hb+HCT+fe+Ca+P+iPTH+alb+cr+bun+com1,family = binomial,data = zxb) summary(log) log.step<-step(log) summary(log.step) # ##############制作表格######## install.packages(c("stats", "MASS", "car", "tidyverse", "knitr", "kableExtra")) library(stats) library(MASS) library(car) library(tidyverse) library(knitr) library(kableExtra) kable(summary(log.step)$coefficients, align = "c", caption = "Logistic Regression Results") %>% kable_styling(bootstrap_options = "hover", full_width = F) %>% column_spec(1, bold = T) %>% column_spec(4, color = "white", background = "steelblue") ############### 将结果转化为表格形式##### result <- data.frame( variable = names(log.step$coefficients)[-1], # 变量名称 beta = coef(log.step)[-1], # β系数 wald_stat = summary(log.step)$coefficients[-1, "z"], # Wald统计量 se = summary(log.step)$coefficients[-1, "Std. Error"], # 标准误差 or = exp(coef(log.step)[-1]), # 比值比 ci_low = exp(confint(log.step)[-1, 1]), # 置信区间下限 ci_high = exp(confint(log.step)[-1, 2]), # 置信区间上限 p_value = summary(log.step)$coefficients[-1, "Pr(>|z|)"] # P值 )

这段代码是进行 logistic 回归分析的，包括数据读入、模型拟合、模型选择以及结果展示等步骤。其中，使用step()函数进行模型选择，生成的模型结果通过summary()函数进行总结统计，并通过kable()和kableExtra()函数将...

library(ggVolcano) > library(ggplot2) > setwd("D:/R projects/GEO-LUNG/data") > > # 加载数据（确保CSV文件中列名与limma结果一致） > deg_data <- read.csv("differential_expression_results.csv", row.names = 1) > > # 关键修正：对齐列名参数 > data <- add_regulate( + deg_data, + log2FC_name = "logFC", # 对应差异分析结果中的logFC列 + fdr_name = "adj.P.Val", # 修正为实际列名 + log2FC = 1, + fdr = 0.05 + ) > > # 绘图（同步修正y轴参数） > p21 <- ggvolcano( + data, + x = "logFC", + y = "adj.P.Val", # 与add_regulate中的fdr_name一致 + fills = c("#e94234", "#b4b4d8", "#269846"), # 下调、不显著、上调 + colors = c("#e94234", "grey", "#269846"), # 点边框色（通常不显著用灰色） + label = "row", + label_number = 10, + output = FALSE + ) 错误于order(data$y): 参数1不是向量

嗯，用户在使用ggvolcano包时遇到了错误“order(data$y) 参数1不是向量”，需要解决这个问题。...install.packages("devtools") devtools::install_github("xxx/ggvolcano") # 替换实际仓库地址 ---

# install.packages("Seurat") # install.packages("tools") # 若未安装工具包 library(Seurat) library(tools) # 用于处理文件名 # 设置工作目录 workDir <- "D:\\Research\\adipose tissue\\mouse\\csv\\GSE273413" setwd(workDir) ###############读取数据############### # 列出所有CSV/TXT格式文件的完整路径（包括子目录） CSV_files <- list.files(workDir, pattern = "\\.csv$", recursive = TRUE, full.names = TRUE) ##如果文件格式是.txt文件，那就将文件后缀名.txt改成.CSV!!!!!! # 遍历所有 .h5 格式文件并读取数据，生成 Seurat 对象 seurat_objects <- lapply(CSV_files, function(CSV_file) { # 检查文件是否存在 if (file.exists(CSV_file)) { message(paste("Processing:", CSV_file)) # 提取文件名作为标识 file_name <- file_path_sans_ext(basename(CSV_file)) # 去掉路径和扩展名 # 读取数据 counts <- read.csv(file = CSV_file,row.names = 1) # 创建 Seurat 对象 seurat_object <- CreateSeuratObject(counts, min.cells = 3, min.features = 200) # 添加 orig.ident 元数据 seurat_object$orig.ident <- file_name # 重命名细胞，避免重复 RenameCells(seurat_object, add.cell.id = file_name) return(seurat_object) } else { warning(paste("File not found:", CSV_file)) return(NULL) } }) # 去掉读取失败的对象 seurat_objects <- Filter(Negate(is.null), seurat_objects) # 合并所有 Seurat 对象 if (length(seurat_objects) > 1) { pbmc <- Reduce(function(x, y) merge(x, y), seurat_objects) } else if (length(seurat_objects) == 1) { pbmc <- seurat_objects[[1]] } else { stop("No Seurat objects to merge!") } # 查看合并后的 Seurat 对象基本信息 print(pbmc) # 检查合并后每个 orig.ident 的细胞数量 print(table(pbmc$orig.ident)) # 保存合并后的 Seurat 对象（可选） setwd(workDir) saveRDS(pbmc, file = "pbmc.rds") 错误于validObject(.Object): 类别为“LogMap”的对象无效: Rownames must be supplied

利用 RStudio 内置工具完成安装过程即可实现无缝迁移体验。 R BiocManager::install('Seurat') --- ### 提供一段示范代码帮助理解如何避免这类常见陷阱下面给出了一段综合考虑以上要点的实际应用案例演示...

请根据我的数据补全下面代码：#加载包 library("Seurat") library("dplyr") library("magrittr") library("Matrix") library("tidyverse") library("ggplot2") library("cowplot") library("SingleR") library("patchwork") library("SingleCellExperiment") library("scales") library("RCurl") library("ggsci") library("clustree") library("SeuratObject") library("ggraph") library("cowplot") library("grid") library("gtable") library("celldex") library("Nebulosa") #设置工作路径 setwd("H:/scRNA/main") step1_1_merged_seurat <- readRDS("H:/scRNA/main/step1_1_merged_seurat.rds") #查看上次分群 table([email protected][["seurat_clusters"]]) ##第一步--提取细胞 sub_0_matrix <- step1_1_merged_seurat@assays$RNA$counts[,which([email protected]$seurat_clusters%in%c(0))] sub_0 <- CreateSeuratObject(counts=sub_0_matrix,project = "sub_0") ##第二步--细胞互作

# install.packages("NMF") # remotes::install_github("sqjin/CellChat") ### 1.数据预处理 ### sub_0 (sub_0) sub_0 (sub_0, selection.method = "vst") sub_0 (sub_0, features = VariableFeatures(sub_0)) sub...

Error: object 'pca.R' not found > source("pca.R") Error in read.ncdf("nowatr.nc") : Please install the ncdf4 package from CRAN

install.packages("ncdf4") 3. 加载包： - 安装完成后，在使用之前需要加载这个包。在R脚本的开头添加以下行： R library(ncdf4) 4. 重新运行脚本： - 安装并加载必要的包后，再次尝试运行 ...

####设置随机数种子使结果可重复#### set.seed(12345) library(Seurat) library(tidyverse) library(magrittr) library(RColorBrewer) library(reshape2) library(Biobase) library(ggsci) library(ggpubr) library(data.table) library(monocle) library(Matrix) library(writexl) 读取.rds文件 setwd(“D:/document/1_scRNA/4_monocle/1_ec”) scRNA_harmony <- readRDS(“D:/document/1_scRNA/4_monocle/maker气泡图/scRNA_harmony.rds”) #分类 new.cluster.ids <- c(“0”= “EC”, “1”= “MC”, “2”= “VC”, “3”= “MC”, “4”= “EC”, “5”= “PC”, “6”= “UN”, “7”= “MC”, “8”= “VC”, “9”= “PC”, “10”= “MC”, “11”= “PC”, “12”= “VC”, “13”= “TRI”, “14”= “VC”) 将新的细胞类型标签存储到 meta.data 中 [email protected]$celltype <- new.cluster.ids[as.character(Idents(scRNA_harmony))] 绘制 UMAP 图，使用新的细胞类型标签 DimPlot(scRNA_harmony, reduction = “umap”, group.by = “celltype”, label = TRUE, label.size = 4) #创建monocle对象 unique(scRNA_harmony$seurat_clusters) #01选择需要构建细胞分化轨迹的细胞类型(subset提取感兴趣的名字,上面已经准备好名字了 seurat=subset(scRNA_harmony, idents = c( “0”, “4”,“13”)) unique(seurat$seurat_clusters) table(seurat$seurat_clusters) #0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 #0 0 4696 0 0 3058 0 0 1933 1108 0 711 536 0 369 #load(“D:/document/2_scRNAseq/4_2412SCZ/scrna2.RData”) #SCT是标准化后的数据，RNA是原始数据 #load(“D:/document/2_scRNAseq/1_SC/BMC_KW_monocle_over.RData”) #02构建monocle独有的celldata对象 expr_matrix=seurat@assays$SCT@counts#使用counts表达值(第一个准备文件:基因count矩阵) ####转换为稀疏矩阵#### 如果 expr_matrix 是稠密矩阵（dense matrix），转换为稀疏矩阵 if (!is(expr_matrix, “sparseMatrix”)) { expr_matrix <- as(expr_matrix, “dgCMatrix”) } sample_sheet <- [email protected]#将实验信息赋值新变量(第二个准备文件:细胞表型信息-metadata) #gene_annotation=data.frame(gene_short_name=rownames(seurat))构建一个含有基因名字的数据框因为默认从RNA中提取细胞信息，所以需要从 SCT assay 中提取基因名 gene_annotation <- data.frame(gene_short_name = rownames(seurat@assays$SCT)) rownames(gene_annotation) <- rownames(seurat@assays$SCT)#(第三个文件:基因名为行名的基因名数据框) pd <- new(“AnnotatedDataFrame”,data= sample_sheet)#将实验信息变量转化为monocel可以接收的对象 fd <- new(“AnnotatedDataFrame”,data=gene_annotation)#将基因注释变量转化为monocle可以接收的对象 cds <- newCellDataSet(expr_matrix, phenoData = pd, featureData = fd,expressionFamily=negbinomial.size())#创建一个monocle的对象 #cds cellData对象，monocle独有 #03相当于归一化Size factors帮助标准化基因在细胞间的差异,"dispersion"值帮助后面的差异表达分析执行。 cds <- estimateSizeFactors(cds) cds <- estimateDispersions(cds) #04数据降维,特征基因的选择 #过滤低表达基因;差异分析获得top1000排序基因(可视化用来排序的基因) ##注意 – differentialGeneTest这一步有些久 cds <- detectGenes(cds,min_expr=0.1)#统计,过滤低表达基因(表达量过滤低表达基因) expressed_genes <- row.names(subset(fData(cds),num_cells_expressed >=10))#(数量过滤低表达基因) diff_celltype <- differentialGeneTest(cds[expressed_genes,], fullModelFormulaStr = “~celltype”,cores=4)#差异分析,cores是处理器核数，电脑带的动可用8或者更大 head(diff_celltype) library (writexl) write_xlsx(diff_celltype, “1_degForCellOrdering.xlsx”) ####1.RData#### save.image(“1.RData”) load(“1.RData”) #选这个 diff_celltype <- diff_celltype[order(diff_celltype$qval),]#将差异基因按照q值进行升序排列 ordering_genes <- row.names(diff_celltype[1:1000,])#选择top1000个显著基因用做后续排序,这里可修改 #ordering_genes <- row.names(diff_celltype[diff_celltype$qval <0.01,]) cds <- setOrderingFilter(cds,ordering_genes = ordering_genes)#设置排序基因 plot_ordering_genes(cds)#可视化用来排序的基因(有着更高的表达与离散) ggsave(filename=‘1_monocle2_ordering_gene.pdf’) ####选择高变基因#### #此次选择monocle选择的高变基因 #选择二、使用monocle选择的高变基因 disp_table <- dispersionTable(cds) disp.genes <- subset(disp_table, mean_expression >= 0.1 & dispersion_empirical >= 1 * dispersion_fit)$gene_id cds <- setOrderingFilter(cds, disp.genes) plot_ordering_genes(cds)#以上是选择monocle选择的高变基因进行轨迹构建,上述为高变基因计算方法,monocle在选择做轨迹的基因上共提供四种方法 ##使用clusters差异表达基因 library(readxl) diff.genes <- read_excel(‘D:/document/1_scRNA/scRNA_harmony.markers.xlsx’) diff.genes <- subset(diff.genes,p_val_adj<0.01)$gene cds <- setOrderingFilter(cds, diff.genes) p1 <- plot_ordering_genes(cds) p1 ##使用seurat选择的高变基因 var.genes <- VariableFeatures(scRNA_harmony) cds <- setOrderingFilter(cds, var.genes) p2 <- plot_ordering_genes(cds) p2 ##使用monocle选择的高变基因 disp_table <- dispersionTable(cds) disp.genes <- subset(disp_table, mean_expression >= 0.1 & dispersion_empirical >= 1 * dispersion_fit)$gene_id cds <- setOrderingFilter(cds, disp.genes) p3 <- plot_ordering_genes(cds) p3 ##结果对比 p1|p2|p3 library(cowplot) combined_plot <- plot_grid(p1, p2, p3, ncol = 3) ggsave(“2_combined_plot.pdf”, combined_plot, width = 15, height = 5) #数据量过大，降维选择稀疏矩阵,但似乎本来就是稀疏矩阵 cds <- reduceDimension(cds, method=‘DDRTree’)#降维 cds <- orderCells(cds)#排序 ##如果这里报错,先保存数据 #保存所有对象到my_workspace.RData save.image(file = “01_orderCells_cds.RData”) load(file = “01_orderCells_cds.RData”) #降级 igraph 包到一个与 Monocle 兼容的版本 #原来的包无法覆盖时可手动删除D:\software\R-4.4.0\library\igraph #install.packages(“remotes”) #remotes::install_version(“igraph”, version = “2.0.2”) ##install.packages(“C:/Users/19086/Desktop/maker气泡图/igraph_2.0.3.tar.gz”, repos = NULL, type = “source”) #可视化鉴定的State p1=plot_cell_trajectory(cds, color_by=“State”)+ theme(text=element_text(size= 18)) #设置字体大小为 18 p1 ggsave(p1,filename =‘2_monocle2_state_trajectory_p1.pdf’, width =12, height = 9) #可视化细胞类型 p2=plot_cell_trajectory(cds, color_by=“seurat_clusters”)+ theme(text= element_text(size=18)) #设置字体大小为 18 p2 ggsave(p2, filename = ‘3_monocle2_celltype_trajectory_p2.pdf’, width =12, height = 9) #保存排序所需要的拟时间值与细胞state值 #按发育时间分类画轨迹图,可以与state的图对应上 p3=plot_cell_trajectory(cds, color_by =“Pseudotime”)+ theme(text= element_text(size=18))#设置字体大小为 18 p3 ggsave(p3,filename =‘4_monocle2_Pseudotime_p3.pdf’, width =12, height = 9) #因为monocle包并不会自动设置分化起点，若发现有悖于生物学常识，则需要手动设置分化起点 #指定细胞分化轨迹的起始点,即设置root cell。 #自定义了一个名为GM_state的函数,函数主要计算包含特定类型细胞最多的state,并返回state练 #即特定细胞类型最多的state为指定起点 GM_state <- function(cds){ if (length(unique(pData(cds)$State)) > 1){ T0_counts <- table(pData(cds)$State, pData(cds)$seurat_clusters)[, “0”] return(as.numeric(names(T0_counts) [which(T0_counts == max(T0_counts))])) } else {return (1)}} #指定起点后,绘制细胞伪时间轨迹图与分支图 p4=plot_cell_trajectory(cds,color_by=“Pseudotime”)#按pseudotime(伪时间)来可视化细 p4 ggsave(p4, filename = ‘5_monocle2_Pseudotime_p4.pdf’, width =12, height = 9) plot_cell_trajectory(cds,color_by=“state”)+facet_wrap(“~State”,nrow=1) #可以用ggsci配色，也可以使用scale_color_manual()自己设置颜色 library(ggsci) p5=plot_cell_trajectory(cds, color_by = “sample”) + scale_color_npg() p6=plot_cell_trajectory(cds, color_by = “State”) + scale_color_nejm() colour = c( “#E64B35”, # 红色 “#4DBBD5”, # 蓝色 “#00A087”, # 绿色 “#3C5488”, # 深蓝色 “#F39B7F”, # 橙色 “#8491B4”, # 灰色 “#91D1C2”, # 浅绿色 “#DC0000”, # 深红色 “#7E6148”, # 棕色 “#B09C85”, # 浅棕色 “#FF7F0E”, # 橙色 “#1F77B4”, # 蓝色 “#2CA02C”, # 绿色 “#D62728”, # 红色 “#9467BD”, # 紫色 “#8C564B” # 棕色 ) p7=plot_cell_trajectory(cds, color_by = “seurat_clusters”) + scale_color_manual(values = colour) p5 p6 p7 ggsave(“5_seurat_clusters.png”, plot = p5, width = 8, height = 6, dpi = 300) ggsave(“6_state.png”, plot = p6, width = 8, height = 6, dpi = 300) ggsave(“7_seurat_clusters.png”, plot = p7, width = 8, height = 6, dpi = 300) p8 <- plot_cell_trajectory(cds, x = 1, y = 2, color_by = “seurat_clusters”) + theme(legend.position=‘none’,panel.border = element_blank()) + #去掉第一个的legend scale_color_manual(values = colour) p9 <- plot_complex_cell_trajectory(cds, x = 1, y = 2, color_by = “seurat_clusters”)+ scale_color_manual(values = colour) + theme(legend.title = element_blank()) p8 p9 ggsave(“8_State1_tree.png”, plot = p8, width = 8, height = 6, dpi = 300) ggsave(“9_state2_tree.png”, plot = p9, width = 8, height = 6, dpi = 300) library(ggpubr) df <- pData(cds) pData(cds)取出的是cds对象中cds@phenoData@data的内容 View(df) p <- ggplot(df, aes(Pseudotime, colour = sample, fill = sample)) + geom_density(bw = 0.5, size = 1, alpha = 0.5) + theme_classic2() p ggsave(“10_density_plot_sample.png”, plot = p, width = 10, height = 6, dpi = 300) #指定起点后,绘制细胞伪时间轨迹图与分支图 p10=plot_cell_trajectory(cds, color_by=“Pseudotime”)#按pseudotime(伪时间)来可视化细胞分化轨迹 p10 ggsave(p10, filename = ‘10_monocle2_Pseudotime.pdf’, width = 12, height = 9) plot_cell_trajectory(cds, color_by =“State”)+ facet_wrap(~seurat_clusters,nrow=2)#facet_wrap函数可以把每个state单独highlight ggsave(filename = ‘11_monocle2_divid_seurat_clusters.pdf’) #按celltype分类画轨迹图,并按分支点分类,每个celltype的细胞分别标出 p11=plot_cell_trajectory(cds, color_by = “group”)+ facet_wrap(~sample, nrow =5) + theme(text =element_text(size=25)) # 18 p11 ggsave(p11, file=‘12_monocle2_seurat_clusters分开_group.pdf’, width = 12, height = 18) save.image(“out1.RData”) library (writexl) #鉴定伪时间相关的基因，即分化过程（state）相关的差异基因，“expressed_genes [1: 1000], ”中把[1:1000]删了就是所有基因 diff_test_res=differentialGeneTest(cds[expressed_genes, ], fullModelFormulaStr = “~sm.ns(Pseudotime)”,cores=2)#鉴定伪时间相关的基因,即分化过程相关 cores = num_cores 使用可用核心数 write_xlsx(diff_test_res, “01_diff_test_res.xlsx”) 注意可以将top5g改成任何自身感兴趣的基因,进行可视化 top100g=rownames(diff_test_res[order(diff_test_res$qval),])[1:100] # top 100个显著基因 plot_genes_in_pseudotime(cds[top100g,], color_by=“orig.ident”,ncol=1)+ # top 5个显著基因，可视化，pseudotime为横坐标 #orig.ident/celltype/seurat_clusters theme(text = element_text(size= 15))#设置字体大小为 15 ggsave(filename = ‘13_monocle_top5_significant_gene.pdf’) top100g_df <- data.frame(Gene = top100g) write_xlsx(top100g_df, “02_monocle_deg_top100.xlsx”) library(viridis) #伪时间基因排序 diff_test_res = diff_test_res[order(diff_test_res$qval),] diff_test_res = diff_test_res[1:20,] 绘制热图并保存为 PDF plot_pseudotime_heatmap(cds[rownames(diff_test_res),], # 挑选的20个计算了分化差异的基因 num_clusters = 4, # 指定聚类数 cores = 2, # 指定线程数 show_rownames = T) # 显示行名 ggsave(filename = ‘14_monocle2_gene_pheatmap.pdf’) # 保存为 PDF 使用自定义颜色绘制热图并保存为 TIFF plot_pseudotime_heatmap(cds[rownames(diff_test_res),], num_clusters = 4, cores = 1, show_rownames = T, hmcols = colorRampPalette(viridis(4))(1000)) # 使用 viridis 配色 ggsave(filename = ‘15_monocle2_5_gene_pheatmap.tiff’, # 保存为 TIFF device = “tiff”, # 指定设备为 TIFF dpi = 300, # 设置分辨率 width = 8, # 设置宽度 height = 6) # 设置高度 save.image(“out3_monocle_diff.RData”) load(“out3_monocle_diff.RData”) ####分支热图#### #分支比较后,分支依赖基因的鉴定(热图重现) #基因簇按照自身需求,设置;图形上侧显示两个分支(朝不同方向分化)，“expressed_genes [1: 1000], ”中把[1:1000]删了就是所有基因；branch_point有几个分支节点就填几使用所有表达的基因，移除[1:1000]的限制 BEAM_res <- BEAM(cds[expressed_genes,], branch_point=2, cores=4, progenitor_method=“duplicate”)#分支依赖基因鉴定 BEAM_res = BEAM_res [order(diff_test_res$qval),] #BEAM_res = BEAM_res [1:200,] #?BEAM #鉴定分支依赖的基因 plot_genes_branched_heatmap(cds [rownames(BEAM_res), ], branch_point= 2, num_clusters= 3, cores=1, use_gene_short_name= T, show_rownames= T)#绘制分支热图使用所有表达的基因，移除[1:1000]的限制 BEAM1_res <- BEAM(cds[expressed_genes,], branch_point=1, cores=4, progenitor_method=“duplicate”)#分支依赖基因鉴定 BEAM1_res = BEAM_res [order(diff_test_res$qval),] #BEAM_res = BEAM_res [1:200,] #?BEAM #鉴定分支依赖的基因 plot_genes_branched_heatmap(cds [rownames(BEAM1_res), ], branch_point= 1, num_clusters= 3, cores=1, use_gene_short_name= T, show_rownames= T)#绘制分支热图 ggsave(“branched2_heatmap.jpg”, p20, width = 8, height = 6) save.image(“out.RData”) load(“D:/document/1_scRNA/4_monocle/1_ec/out.RData”) 怎么看不同state中我想关注的许多基因在不同group中的表达情况

针对您的问题——如何在不同的 State 中查看多个感兴趣基因在不同 group 中的表达情况，我将提供一个完整的解决方案，包含可视化热图和点图代码，并详细解释每个步骤。以下是解决方案的 R 代码： r # 加载...

中医元仔智能医疗机器人-基于LangChain4j与阿里通义千问的中医诊疗对话AI-集成多轮对话记忆与RAG知识检索的智能助手-支持预约挂号与取消功能的医疗系统-采用Java17.zip

cursor免费次数用完中医元仔智能医疗机器人_基于LangChain4j与阿里通义千问的中医诊疗对话AI_集成多轮对话记忆与RAG知识检索的智能助手_支持预约挂号与取消功能的医疗系统_采用Java17.zip

主流关系库SQL调优（SQL TUNING或SQL优化）学习

本文对SQL调优（SQL TUNING或SQL优化）话题进行了较为深入的探讨和解析，记录于此，供各位和自己研究学习。

基于Mirai框架开发的智能QQ群管理机器人系统_集成MySQL数据库存储_OpenNLP自然语言处理_Lucene文本分词技术_实现主人控制_群主管理_群管操作_发言实时检测_积.zip

基于Mirai框架开发的智能QQ群管理机器人系统_集成MySQL数据库存储_OpenNLP自然语言处......

相关推荐

Windows系统上R语言的安装与初步配置：一份详尽指南

R语言教程：R语言常见命令大全

R语言学习系列01-R语言的安装与使用.pdf

rm(list = ls()) setwd("C:/Rdate") getwd() windowsFonts() #下载包# install.packages("ggplot2") install.packages("openxlsx") #加载包# library(ggplot2) library(openxlsx) #导入数据# go_enrich = read.xlsx("25_400vs25_CK.GO.xlsx",sheet= "ONTOLOGY",sep=',') head(go_enrich)错误

R语言中# 1.1 设置工作路径setwd("D:\\EnvStat\\corrplot") # 1.2 加载R包#library(devtools)#install_github("ggobi/ggally")install.packages("GGally")library(GGally)library(rstatix) # 1.3 读入数据env = read.csv("env.csv",header = TRUE,row.names = 1)env每个是啥意思

错误于.io_check_exists(path(con)): file(s) do not exist: ‘G:/R-4.5.0/Rstudio/ieu-a-2.vcf/’

Error: object 'pca.R' not found > source("pca.R") Error in read.ncdf("nowatr.nc") : Please install the ncdf4 package from CRAN

中医元仔智能医疗机器人-基于LangChain4j与阿里通义千问的中医诊疗对话AI-集成多轮对话记忆与RAG知识检索的智能助手-支持预约挂号与取消功能的医疗系统-采用Java17.zip

主流关系库SQL调优（SQL TUNING或SQL优化）学习

基于Mirai框架开发的智能QQ群管理机器人系统_集成MySQL数据库存储_OpenNLP自然语言处理_Lucene文本分词技术_实现主人控制_群主管理_群管操作_发言实时检测_积.zip

大家在看

批量提取eml

AMIDE-开源

基于 ADS9110的隔离式数据采集 (DAQ) 系统方案（待编辑）-电路方案

自动化图书管理系统 v7.0

白盒测试基本路径自动生成工具制作文档附代码

最新推荐

中医元仔智能医疗机器人-基于LangChain4j与阿里通义千问的中医诊疗对话AI-集成多轮对话记忆与RAG知识检索的智能助手-支持预约挂号与取消功能的医疗系统-采用Java17.zip

LabVIEW结合YOLOv5与TensorRT实现高效并行推理及DLL封装技术在工业领域的应用 · DLL封装

反弹头发福瑞特如果热隔热

MATLAB中ABS防抱死系统加入干扰并使用PID进行校正的方法 MATLAB

OTA升级方案上位机源码（支持整包和差分）

Notes App API开发与使用指南

【PMSM建模与测试最佳实践】：MATLAB电机仿真模型的权威指导

如何通过四元数避免万向节死锁？

Python实现Couchbase大规模数据复制技术

【MATLAB电机性能评估案例】：仿真环境下的深度研究