Skip to content
GitLab
Explore
Sign in
Primary navigation
Search or go to…
Project
DOGMA
Manage
Activity
Members
Labels
Plan
Issues
Issue boards
Milestones
Iterations
Wiki
Requirements
Code
Merge requests
Repository
Branches
Commits
Tags
Repository graph
Compare revisions
Snippets
Locked files
Build
Pipelines
Jobs
Pipeline schedules
Test cases
Artifacts
Deploy
Releases
Package Registry
Container Registry
Model registry
Operate
Environments
Terraform modules
Monitor
Incidents
Service Desk
Analyze
Value stream analytics
Contributor analytics
CI/CD analytics
Repository analytics
Code review analytics
Issue analytics
Insights
Model experiments
Help
Help
Support
GitLab documentation
Compare GitLab plans
Community forum
Contribute to GitLab
Provide feedback
Keyboard shortcuts
?
Snippets
Groups
Projects
Show more breadcrumbs
domain-world
DOGMA
Commits
ea2640bd
Commit
ea2640bd
authored
1 year ago
by
Dr. Elias Dohmen
Browse files
Options
Downloads
Plain Diff
Merge branch 'ed_develop' into 'master'
DOGMA v3.8 See merge request
!4
parents
b66fa5a6
c715ce04
No related branches found
Branches containing commit
Tags
v3.8
Tags containing commit
1 merge request
!4
DOGMA v3.8
Changes
4
Hide whitespace changes
Inline
Side-by-side
Showing
4 changed files
CHANGELOG
+6
-0
6 additions, 0 deletions
CHANGELOG
README.md
+1
-1
1 addition, 1 deletion
README.md
UserManual.pdf
+0
-0
0 additions, 0 deletions
UserManual.pdf
dogma.py
+10
-10
10 additions, 10 deletions
dogma.py
with
17 additions
and
11 deletions
CHANGELOG
+
6
−
0
View file @
ea2640bd
DOGMA 3.8
=========
- update to Pfam Database version 36 (default for DOGMA from this version on)
DOGMA 3.7
=========
- update to Pfam Database version 35 (default for DOGMA from this version on)
- runs with new RADIANT version 1.0
- updated error handling for initial RADIANT annotation of fasta files if RADIANT is not in the PATH variable
...
...
This diff is collapsed.
Click to expand it.
README.md
+
1
−
1
View file @
ea2640bd
...
...
@@ -16,7 +16,7 @@ Current dependencies are (but you will need just one of them):
-
RADIANT (https://domainworld.uni-muenster.de/programs/radiant/)
OR
-
pfam_scan.pl (
f
tp://ftp.ebi.ac.uk/pub/databases/Pfam/Tools/)
-
pfam_scan.pl (
ht
tp://ftp.ebi.ac.uk/pub/databases/Pfam/Tools/)
Furthermore you will need a core set to run DOGMA.
...
...
This diff is collapsed.
Click to expand it.
UserManual.pdf
100644 → 100755
+
0
−
0
View file @
ea2640bd
No preview for this file type
This diff is collapsed.
Click to expand it.
dogma.py
+
10
−
10
View file @
ea2640bd
#!/usr/bin/env python
# DOGMA version 3.
7
# DOGMA version 3.
8
# DOGMA is a python script that can assess proteome or transcriptome quality based on conserved protein domains.
# To score the domain completeness of a proteome or transcriptome, DOGMA searches its domain annotation for conserved
# domains. By default, the conserved domains comprise domains that are shared by six eukaryotic model species.
# Copyright (C) 2015-2023 Elias Dohmen
# <e.dohmen@
wwu
.de> based on code by Lukas Kremer.
# <e.dohmen@
uni-muenster
.de> based on code by Lukas Kremer.
# DOGMA is free software: you can redistribute it and/or modify it
# under the terms of the GNU General Public License as published by
...
...
@@ -48,7 +48,7 @@ conversion_dictionary = None
def
main
():
dogma_version
=
'
3.
7
'
dogma_version
=
'
3.
8
'
try
:
# top level argument parsing
...
...
@@ -94,8 +94,8 @@ def main():
parser_proteome
.
add_argument
(
"
-o
"
,
"
--outfile
"
,
action
=
"
store
"
,
type
=
str
,
default
=
None
,
help
=
"
Summary will be saved in a file with the given name (and path),
"
"
instead of printed in the console.
"
)
parser_proteome
.
add_argument
(
"
-m
"
,
"
--pfam
"
,
action
=
"
store
"
,
type
=
str
,
default
=
"
3
5
"
,
help
=
"
The version number of the pfam database that should be used (Default is 3
5
).
"
)
parser_proteome
.
add_argument
(
"
-m
"
,
"
--pfam
"
,
action
=
"
store
"
,
type
=
str
,
default
=
"
3
6
"
,
help
=
"
The version number of the pfam database that should be used (Default is 3
6
).
"
)
parser_proteome
.
add_argument
(
"
-d
"
,
"
--database
"
,
action
=
"
store
"
,
type
=
str
,
default
=
None
,
help
=
"
If the RADIANT database is not located in the RADIANT directory, please specify
"
"
path and name of the database. (Just necessary for -i option)
"
)
...
...
@@ -126,9 +126,9 @@ def main():
parser_transcriptome
.
add_argument
(
"
-s
"
,
"
--cda_size
"
,
action
=
"
store
"
,
default
=
3
,
type
=
int
,
help
=
"
Specifies up to which size subsets of CDAs should be considered
"
"
(default=3; A-B-C-D --> A-B-C, A-B-D, B-C-D etc.).
"
)
parser_transcriptome
.
add_argument
(
"
-m
"
,
"
--pfam
"
,
action
=
"
store
"
,
type
=
str
,
default
=
"
3
5
"
,
parser_transcriptome
.
add_argument
(
"
-m
"
,
"
--pfam
"
,
action
=
"
store
"
,
type
=
str
,
default
=
"
3
6
"
,
help
=
"
The version number of the pfam database that should be used
"
"
(Default is 3
5
).
"
)
"
(Default is 3
6
).
"
)
parser_transcriptome
.
add_argument
(
"
-d
"
,
"
--database
"
,
action
=
"
store
"
,
default
=
None
,
help
=
"
If the RADIANT database is not located in the RADIANT directory, please specify
"
"
path and name of the database. (Just necessary for -i option)
"
)
...
...
@@ -267,7 +267,7 @@ class ConversionDictionary(dict):
def
score_single_transcriptome
(
annotation_file
,
outfile
=
None
,
max_dom_tup_len
=
3
,
hq_transcriptomes
=
None
,
mode
=
'
transcriptome
'
,
pfam
=
'
3
5
'
,
initial
=
None
,
version
=
'
3.
7
'
,
hq_transcriptomes
=
None
,
mode
=
'
transcriptome
'
,
pfam
=
'
3
6
'
,
initial
=
None
,
version
=
'
3.
8
'
,
annotype
=
'
pfsc
'
,
coverage
=
0.5
):
"""
combines the functions and classes to score a sample proteome in terms of it
'
s domain completeness.
...
...
@@ -345,7 +345,7 @@ def score_single_transcriptome(annotation_file, outfile=None, max_dom_tup_len=3,
def
score_single_proteome
(
annotation_file
,
outfile
=
None
,
cutoff
=
2
,
max_dom_tup_len
=
3
,
hq_proteomes
=
None
,
mode
=
'
proteome
'
,
pfam
=
'
3
5
'
,
initial
=
None
,
version
=
'
3.
7
'
,
max_dom_tup_len
=
3
,
hq_proteomes
=
None
,
mode
=
'
proteome
'
,
pfam
=
'
3
6
'
,
initial
=
None
,
version
=
'
3.
8
'
,
annotype
=
'
pfsc
'
,
coverage
=
0.5
):
"""
combines the functions and classes to score a sample proteome in terms of it
'
s domain completeness.
...
...
@@ -776,7 +776,7 @@ class QualityChecker:
if
count_in_candidate
<
count_in_HQ
:
self
.
doms_missing_number
+=
count_in_HQ
-
count_in_candidate
self
.
out
.
append
((
count_in_candidate
,
self
.
cda_count_dict
[
dom
],
dom
))
self
.
out
.
sort
(
key
=
lambda
l
:
l
[
2
])
self
.
out
.
sort
(
key
=
lambda
ele
:
ele
[
2
])
if
self
.
number_of_CDA
==
0
:
self
.
percentage
=
"
NA
"
...
...
This diff is collapsed.
Click to expand it.
Preview
0%
Loading
Try again
or
attach a new file
.
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Save comment
Cancel
Please
register
or
sign in
to comment