@@ -3900,37 +3900,42 @@ entrez_over_to_gsea = function(my_entrez_rank, species, gene_collections = NULL
3900
3900
# Check if package is installed, otherwise install
3901
3901
check_and_install_packages(c(" fastmatch" , " clusterProfiler" ))
3902
3902
3903
+ # Check msigdbr version
3904
+ if (packageVersion(" msigdbr" ) < " 10.0.0" ) {
3905
+ stop(" tidybulk says: msigdbr version must be >= 10.0.0" )
3906
+ }
3903
3907
3904
3908
3905
3909
# Get gene sets signatures
3906
- msigdbr :: msigdbr(species = species ) %> %
3910
+ # Get MSigDB data
3911
+ msigdb_data = msigdbr :: msigdbr(species = species )
3907
3912
3908
- # Filter specific gene_collections if specified. This was introduced to speed up examples executionS
3909
- when(
3910
- ! is.null(gene_collections ) ~ filter(. , gs_cat %in% gene_collections ),
3911
- ~ (. )
3912
- ) %> %
3913
+ # Filter for specific gene collections if provided
3914
+ if (! is.null(gene_collections )) {
3915
+ msigdb_data = filter(msigdb_data , gs_collection %in% gene_collections )
3916
+ }
3913
3917
3914
- # Execute calculation
3915
- nest(data = - gs_cat ) %> %
3918
+ # Process the data
3919
+ msigdb_data | >
3920
+ nest(data = - gs_collection ) | >
3916
3921
mutate(test =
3917
3922
map(
3918
3923
data ,
3919
3924
~ clusterProfiler :: enricher(
3920
3925
my_entrez_rank ,
3921
- TERM2GENE = .x % > % select(gs_name , entrez_gene ),
3926
+ TERM2GENE = .x | > select(gs_name , ncbi_gene ),
3922
3927
pvalueCutoff = 1
3923
- ) % > %
3924
- as_tibble
3925
- )) % > %
3926
- select(- data ) % > %
3927
- unnest(test ) % > %
3928
+ ) | >
3929
+ as_tibble()
3930
+ )) | >
3931
+ select(- data ) | >
3932
+ unnest(test ) | >
3928
3933
3929
3934
# Order
3930
- arrange(`p.adjust` ) % > %
3935
+ arrange(`p.adjust` ) | >
3931
3936
3932
3937
# format transcripts
3933
- mutate(entrez = strsplit(geneID , " /" )) % > %
3938
+ mutate(entrez = strsplit(geneID , " /" )) | >
3934
3939
select(- geneID )
3935
3940
3936
3941
}
0 commit comments