##----代码,echo=FALSE-------------------------------------------------------date=“`r文档日期()`”pkg=“`r pkg_ver('CNEr')`”##----全局选项,echo=FALSE-----------------------------------------------short=TRUE#如果short==TRUE,则不回显代码块调试=FALSEknitr::opts_chunk$set(echo=!short,warning=debug,message=debup,error=FALSE,cache.path=“缓存/”,图路径=“数字/”)##----轴,评估=真,回声=真------------------------------------------------图书馆(CNEr)##这些axt文件是专门为该地区准备的##(chr6:24000000..2700000)axtFilesHg38DanRer10<-file.path(system.file(“extdata”,package=“CNEr”),“hg38.danRer10.net.axt”)axtFilesDanRer10Hg38<-file.path(system.file(“extdata”,package=“CNEr”),“danRer10.hg38.net.axt”)##----readAxt,eval=TRUE,echo=TRUE--------------------------------------------axtHg38DanRer10<-readAxt(axtFilesHg38丹Rer10)axtDanRer10Hg38<-readAxt(axtFilesDanRer10 Hg38)##----showAxt,eval=真,echo=真--------------------------------------------##Axt类以UCSC Axt格式显示axtHg38DanRer10公司axtDanRer10Hg38公司##----matchDistribution,eval=TRUE,echo=TRUE----------------------------------##匹配比对的分布;给定Axt对齐,用每个匹配对齐的百分比绘制热图匹配分发(axtHg38DanRer10)匹配分发(axtDanRer10Hg38)##----syntenyDotplot,eval=TRUE,echo=TRUE-------------------------------------##hg19和galGal3上的chr4示例##人类和斑马鱼的共性在点图上并不十分明显。文库(BSgenome.Hsapiens.UCSC.hg19)库(BSgenome.Ggallus.UCSC.galGal3)fn<-file.path(system.file(“extdata”,package=“CNEr”),“chr4.hg19.galGal3.net.axt.gz”)axt<-readAxt(fn,tAssemblyFn=文件路径(system.file(“extdata”,package=“BSgenome.Hsapiens.UCSC.hg19”),“single_sequences.2bit”),qAssemblyFn=file.path(system.file(“extdata”,package=“BSgenome.Ggallus.UCSC.galGal3”),“single_sequences.2bit”))库(GenomeInfoDb)syntenicDotplot(axt,firstChrs=c(“chr4”),secondChrs=“chr5”,type=“dot”)##----UCSC,eval=FALSE,echo=TRUE----------------------------------------------###从UCSC获取rmsk表#库(rtracklayer)#mySession<-browserSession(“UCSC”)#基因组(mySession)<-“hg38”#hg38.rmsk<-getTable(ucscTableQuery(mySession,track=“RepeatMasker”,#表=“rmsk”))#hg38.rmskGRanges<-GRanges(seqnames=hg38.rmsk$genoName,###UCSC坐标是基于0的。#ranges=I范围(start=hg38.rmsk$genoStart+1,#end=hg38.rmsk$genoEnd),#strand=hg38.rmsk$strand)###从BioMart获取集合基因外显子#图书馆(bioRt)#信号群<-useMart(biomart=“ensembl_MART_ensembl”,#host=“dec2015.archive.ensembl.org”)#ensembl<-useDataset(“hsapiens_gene_ensembl”,mart=ensembl)#属性<-listAttributes(信号群)#外显子<-getBM(attributes=c(“chromosome_name”,“exon_chrom_start”,#“exon_chrome_end”,“strand”),#mart=集合)#exonsRanges<-GRanges(seqnames=exons$chromosome_name,#ranges=I范围(开始=外显子$exon_chrom_start,#end=外显子$exon_chrom_end),#strand=ifelse(外显子$strand==1L,“+”,“-”)# )#seqlevelsStyle(外显子范围)<-“UCSC”###使用hg38的现有Bioconductor注释包#库(TxDb.Hsapiens.UCSC.hg38.knownGene)#外显子范围<-外显子(TxDb.Hsapiens.UCSC.hg38.knownGene)##----床,评估=真,回声=真------------------------------------------------##Zebrafish danRer10的chr6:24000000..2700000的现有床文件bedDanRer10Fn<-file.path(system.file(“extdata”,package=“CNEr”),“filter_regions.danRer10.bed”)danRer10过滤器<-读取床(床DanRer10Fn)danRer10过滤器##Human hg38中对齐区域的现有床文件##chr6:24000000..27000000丹雷尔10bedHg38Fn<-file.path(system.file(“extdata”,package=“CNEr”),“filter_regions.hg38.bed”)hg38过滤器<-readBed(bedHg38Fn)hg38过滤器##----CNE,eval=真,echo=真------------------------------------------------##这里我们有来自Bioconductor包的两位文件##英国基因组。Drerio.UCSC.danRer10和BSgenome。哈皮恩斯。加州大学旧金山分校hg38cneDanRer10Hg38<-CNE(assembly1Fn=文件路径(system.file(“extdata”,package=“BSgenome.Drerio.UCSC.danRer10”),“single_sequences.2bit”),assembly2Fn=文件路径(system.file(“extdata”,package=“BSgenomen.Hsapiens.UCSC.hg38”),“single_sequences.2bit”),axt12Fn=axtFilesDanRer10Hg38,axt21Fn=axtFilesHg38DanRer10,切断1=8L,切断2=4L)cneDanRer10Hg38##----CNEScan,eval=真,echo=真--------------------------------------------标识<-c(45L、48L、49L)窗户<-c(50L、50L、50L)##这里,danRer10Filter是tFilter,因为danRer是组件1cneListDanRer10Hg38<-ceScan(x=cneDanRer10Hg38,tFilter=danRer10Filter,qFilter=hg38过滤器,窗口=窗口,标识=标识)##----CNEScanHead,eval=真,echo=真----------------------------------------##以danRer10为参考的路线CNECNE12(cneListDanRer10Hg38[[“45_50”]])##以hg38为参考的路线CNECNE21(cneListDanRer10Hg38[[“45_50”]])##----CNEMerge,eval=真,echo=真-------------------------------------------cneMergedListDanRer10Hg38<-lapply(cneListDanRer10Hg38,cneMerge)##----CNE应答,eval=FALSE,echo=TRUE------------------------------------#cneFinalListDanRer10Hg38<-重叠(cneMergedListDanRer10Hg38,blatCNE)##----saveCNE,eval=TRUE,echo=TRUE--------------------------------------------##在单个表上数据库名称<-tempfile()数据(cneFinalListDanRer10Hg38)表格名称<-paste(“danRer10”,“hg38”,名称(cneFinalListDanRer10Hg38),sep=“_”)对于(i in 1:长度(cneFinalListDanRer10Hg38)){saveCNEToSQLite(cneFinalListDanRer10Hg38[[i]],数据库名,表名[i],覆盖=真)}##----查询CNE,eval=TRUE,echo=TRUE-------------------------------------------chr<-“chr6”启动<-2400000L末端<-27000000L最小长度<-50L表格名称<-“danRer10_hg38_45_50”fetchedCNERanges<-readCNERangesFromSQLite(dbName,tableName,chr,start,end,whichAssembly=“first”,minLength=最小长度)获取的CNE范围##----CNEWidthDistribution,eval=TRUE,echo=TRUE-------------------------------dbName<-file.path(system.file(“extdata”,package=“CNEr”),“danRer10CNE.sqlite”)t装配Fn<-file.path(system.file(“extdata”,package=“BSgenome.Drerio.UCSC.danRer10”),“single_sequences.2bit”)qAssemblyFn<-file.path(system.file(“extdata”,package=“BSgenomen.Hsapiens.UCSC.hg38”),“single_sequences.2bit”)cneGRangePairs<-readCNERangesFromSQLite(dbName=dbName,tableName=“danRer10_hg38_45_50”,t总成Fn=t总成fn,qAssemblyFn=qAssembleFn)plotCNEWidth(cneGRangePairs)##----plotCNE分布,eval=TRUE,echo=TRUE--------------------------------plotCNE分布(第一个(cneGRangePairs))##----outputBedBW,eval=FALSE,echo=TRUE---------------------------------------#制造CNE密度(cneGRangePairs[1:1000])##----queryUCSC,eval=FALSE,echo=TRUE,cache=TRUE-----------------------------#图书馆(Gviz)#图书馆(bioRt)#基因组<-“danRer10”#轴跟踪<-GenemeAxisTrack()#cpg群岛<-UcscTrack(基因组=基因组,染色体=chr,#track=“cpgIslandExt”,从=开始,到=结束,#trackType=“AnnotationTrack”,start=“chromStart”,#end=“chromEnd”,id=“name”,shape=“box”,#showId=假,#fill=“#006400”,name=“CpG”,#background.title=“棕色”)#refGenes<-UcscTrack(基因组=基因组,染色体=chr,#track=“refGene”,from=开始,to=结束,#trackType=“GeneRegionTrack”,rstarts=“exonStarts”,#rends=“exonEnds”,gene=“name2”,symbol=“name3”,#transcript=“name”,strand=“strand”,fill=“#8282d2”,#name=“refSeq Genes”,collapseTranscripts=TRUE,#showId=TRUE,background.title=“棕色”)#信号群<-useMart(biomart=“ensembl_MART_ensembl”,#host=“dec2015.archive.ensembl.org”)#ensembl<-useDataset(“drerio_gene_ensembl”,mart=ensembl)#biomTrack<-BiomartGeneRegionTrack(基因组=基因组,染色体=chr,#biomart=信号群,#start=开始,end=结束,name=“集合基因”)##----loadAnnotation,eval=TRUE,echo=FALSE------------------------------------数据(axisTrack)数据(cpg群岛)数据(参考基因)##----plotAnnotation,eval=TRUE,echo=TRUE,fig.height=5,fig.width=7----------图书馆(Gviz)plotTracks(列表(axisTrack,cpgIslands,refGenes),collapseTranscripts=TRUE,shape=“箭头”,transcriptAnnotation=“symbol”)##----保密性,评估=真,回声=真-----------------------------------------dbName<-file.path(system.file(“extdata”,package=“CNEr”),“danRer10CNE.sqlite”)基因组<-“danRer10”窗户尺寸<-200L最小长度<-50LcneDanRer10Hg38_21_30CNEDensity(数据库名称=数据库名称,tableName=“danRer10_hg38_21_30”,whichAssembly=“first”,chr=chr,start=start,end=结束,windowSize=窗口大小,minLength=最小长度)cneDan重置10Hg38_45_50<-CNEDensity(数据库名称=数据库名称,tableName=“danRer10_hg38_45_50”,whichAssembly=“first”,chr=chr,start=start,end=结束,windowSize=窗口大小,minLength=最小长度)cneDan回路10Hg38_49_50<-CNEDensity(数据库名称=数据库名称,tableName=“danRer10_hg38_49_50”,whichAssembly=“first”,chr=chr,start=start,end=结束,windowSize=窗口大小,minLength=最小长度)cneDanRer10AstMex102_48_50<-CNEDensity(数据库名称=数据库名称,tableName=“AstMex102_danRer10_48_50”,whichAssembly=“second”,chr=chr,start=start,end=结束,windowSize=窗口大小,minLength=最小长度)cneDanRer10标准1_75_75<-CNEDensity(数据库名称=数据库名称,tableName=“cteIde_danRer10_75_75”,whichAssembly=“second”,chr=chr,start=start,end=结束,windowSize=窗口大小,minLength=最小长度)##----GvizDataTrack,eval=真,echo=真--------------------------------------dTrack1<-DataTrack(范围=cneDanRer10Hg38_21_30,基因组=基因组,type=“水平”,horizon.scale=最大值(cneDanRer10Hg38_21_30$score)/3,填充地平线=c(“#B41414”,“#E03231”,“#F7A99C”,“黄色”、“橙色”、“红色”),name=“人类21/30”,背景。title=“棕色”)dTrack2<-DataTrack(范围=cneDanRer10Hg38_45_50,基因组=基因组,type=“水平”,horizon.scale=最大值(cneDanRer10Hg38_45_50$score)/2,填充地平线=c(“#B41414”,“#E03231”,“#F7A99C”,“黄色”、“橙色”、“红色”),name=“human 45/50”,background.title=“brown”)dTrack3<-数据跟踪(范围=cneDanRer10Hg38_49_50,基因组=基因组,type=“水平”,horizon.scale=最大值(cneDanRer10Hg38_21_30$score)/3,填充地平线=c(“#B41414”,“#E03231”,“#F7A99C”,“黄色”、“橙色”、“红色”),name=“human 49/50”,background.title=“brown”)dTrack4<-DataTrack(范围=cneDanRer10AstMex102_48_50,基因组=基因组,type=“水平”,horizon.scale=最大值(cneDanRer10Hg38_21_30$score)/3,填充地平线=c(“#B41414”,“#E03231”,“#F7A99C”,“黄色”、“橙色”、“红色”),name=“盲洞鱼48/50”,background.title=“棕色”)dTrack5<-DataTrack(范围=cneDanRer10TeIde1_75_75,基因组=基因组,type=“水平”,horizon.scale=最大值(cneDanRer10TeIde1_75_75$score)/3,填充地平线=c(“#B41414”,“#E03231”,“#F7A99C”,“黄色”、“橙色”、“红色”),name=“草鱼75/75”,background.title=“棕色”)##----plotCNE,eval=TRUE,echo=TRUE,图高=10,图宽=8----------------ht<-HighlightTrack(trackList=list(refGenes,dTrack5,dTrack 4,dTrack1、dTrack2、dTrack3),开始=c(24200000,25200000,26200000),end=c(2510000026150002700000),染色体=chr)plotTracks(列表(axisTrack,cpgIslands,ht),collapseTranscripts=TRUE,shape=“箭头”,transcriptAnnotation=“symbol”,从=24000000到=2700000)##----sessionInfo,eval=真,echo=真----------------------------------------sessionInfo()