From 79de98366de429c387d702b7eba246b5042c86ab Mon Sep 17 00:00:00 2001 From: steve-fischer-200 Date: Mon, 16 Feb 2026 12:31:18 -0500 Subject: [PATCH 1/7] 3 new ortho tables --- .../tuningManager/orthomclTuningManager.xml | 158 +++++++++++++++++- 1 file changed, 157 insertions(+), 1 deletion(-) diff --git a/Model/lib/xml/tuningManager/orthomclTuningManager.xml b/Model/lib/xml/tuningManager/orthomclTuningManager.xml index c6ae9afa..821a12ec 100644 --- a/Model/lib/xml/tuningManager/orthomclTuningManager.xml +++ b/Model/lib/xml/tuningManager/orthomclTuningManager.xml @@ -2,6 +2,70 @@ + + + + + + + + + + + + + + + @@ -144,8 +208,100 @@ + + + + + + + + + + + + + + + + + + + - + + + + + + From c21385c38424281ddfa3799346c634f118de0f6c Mon Sep 17 00:00:00 2001 From: Eve <53914655+ebapidb@users.noreply.github.com> Date: Mon, 16 Feb 2026 12:27:30 +0000 Subject: [PATCH 2/7] a.armitage --- .../xml/datasetPresenters/contacts/allContacts.xml | 12 ++++++++++++ 1 file changed, 12 insertions(+) diff --git a/Model/lib/xml/datasetPresenters/contacts/allContacts.xml b/Model/lib/xml/datasetPresenters/contacts/allContacts.xml index 16deb52f..180c23ca 100644 --- a/Model/lib/xml/datasetPresenters/contacts/allContacts.xml +++ b/Model/lib/xml/datasetPresenters/contacts/allContacts.xml @@ -27,6 +27,18 @@ + + a.armitage + Andrew Armitage + Natural Resources Institute, University of Greenwich, Kent, ME4 4TB, U.K. + +
+ + + + +
+ j.d.bohbot J.D. Bohbot From b9d49b282d9b9099b11d867d9c9d0b4222e5987a Mon Sep 17 00:00:00 2001 From: Eve <53914655+ebapidb@users.noreply.github.com> Date: Mon, 16 Feb 2026 12:39:51 +0000 Subject: [PATCH 3/7] a.armitage --- Model/lib/xml/datasetPresenters/contacts/allContacts.xml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/Model/lib/xml/datasetPresenters/contacts/allContacts.xml b/Model/lib/xml/datasetPresenters/contacts/allContacts.xml index 180c23ca..8f7e022c 100644 --- a/Model/lib/xml/datasetPresenters/contacts/allContacts.xml +++ b/Model/lib/xml/datasetPresenters/contacts/allContacts.xml @@ -31,7 +31,7 @@ a.armitage Andrew Armitage Natural Resources Institute, University of Greenwich, Kent, ME4 4TB, U.K. - + A.D.Armitage@gre.ac.uk
From 2531c6f8378dabaa76454cf7a5df51f260ac980c Mon Sep 17 00:00:00 2001 From: rdemko2332 Date: Mon, 16 Feb 2026 13:15:23 -0500 Subject: [PATCH 4/7] Updating sequence attributes table with product description changes to fill missing descriptions --- .../tuningManager/orthomclTuningManager.xml | 141 +++++++++++------- 1 file changed, 87 insertions(+), 54 deletions(-) diff --git a/Model/lib/xml/tuningManager/orthomclTuningManager.xml b/Model/lib/xml/tuningManager/orthomclTuningManager.xml index 821a12ec..fba515a4 100644 --- a/Model/lib/xml/tuningManager/orthomclTuningManager.xml +++ b/Model/lib/xml/tuningManager/orthomclTuningManager.xml @@ -74,17 +74,20 @@ LEFT JOIN ( + From 93c250017820c88c41632cb1c8ca110174575304 Mon Sep 17 00:00:00 2001 From: steve-fischer-200 Date: Wed, 18 Feb 2026 12:51:57 -0500 Subject: [PATCH 5/7] update seq attrs table --- .../tuningManager/orthomclTuningManager.xml | 205 ++++++++++-------- 1 file changed, 119 insertions(+), 86 deletions(-) diff --git a/Model/lib/xml/tuningManager/orthomclTuningManager.xml b/Model/lib/xml/tuningManager/orthomclTuningManager.xml index fba515a4..125bec61 100644 --- a/Model/lib/xml/tuningManager/orthomclTuningManager.xml +++ b/Model/lib/xml/tuningManager/orthomclTuningManager.xml @@ -84,10 +84,8 @@ LEFT JOIN ( aas.source_id AS full_id, aas.source_id, aas.aa_sequence_id, - length(aas.sequence) AS length, - - COALESCE(aas.description, ta.gene_product) AS product, - + length(aas.sequence) as length, + aas.description AS product, aas.taxon_id, taxon.orthomcl_taxon_id, @@ -102,102 +100,80 @@ LEFT JOIN ( o.number_of_core_members, o.number_of_peripheral_members, CASE is_residual WHEN 1 THEN 'Residual' - ELSE 'Core' END AS group_type, + ELSE 'Core' END AS group_type, urls.source_url, - urls.source_text - - FROM dots.AASequence aas - - JOIN apidb.orthologGroupAASequence ogseq - ON aas.aa_sequence_id = ogseq.aa_sequence_id - - JOIN apidb.orthologGroup o - ON ogseq.group_id = o.group_id - - LEFT JOIN 
apidbtuning.transcriptattributes ta - ON ta.protein_source_id = aas.source_id - - JOIN ( + urls.source_text, + da_agg.pfam_domains + FROM + dots.AASequence aas + LEFT JOIN ( + SELECT + aa_sequence_id, + string_agg(accession, ', ') AS pfam_domains + FROM apidbTuning.DomainAssignment + GROUP BY aa_sequence_id + ) da_agg ON aas.aa_sequence_id = da_agg.aa_sequence_id, + apidb.orthologGroup o, + apidb.orthologGroupAASequence ogseq, + ( SELECT o.orthomcl_abbrev, - o.taxon_id AS orthomcl_taxon_id, + o.taxon_id as orthomcl_taxon_id, t.name, t.core_peripheral, t.taxon_group FROM apidb.organism o, - ( - WITH RECURSIVE TaxonHierarchy AS ( - SELECT - three_letter_abbrev, - orthomcl_clade_id, - name, - core_peripheral, - name AS taxon_group, - parent_id - FROM apidb.OrthomclClade - WHERE name IN ( - 'Archaea','Bacteria','Alveolates','Amoebozoa', - 'Euglenozoa','Fungi','Metazoa', - 'Other Eukaryota','Viridiplantae' - ) - - UNION ALL - - SELECT - child.three_letter_abbrev, - child.orthomcl_clade_id, - child.name, - child.core_peripheral, - parent.taxon_group, - child.parent_id - FROM apidb.OrthomclClade child - JOIN TaxonHierarchy parent - ON child.parent_id = parent.orthomcl_clade_id + (WITH RECURSIVE TaxonHierarchy AS ( + SELECT + three_letter_abbrev, + orthomcl_clade_id, + name, + core_peripheral, + name AS taxon_group, + parent_id + FROM apidb.OrthomclClade + WHERE name IN ('Archaea', 'Bacteria', 'Alveolates', 'Amoebozoa', 'Euglenozoa', + 'Fungi', 'Metazoa', 'Other Eukaryota', 'Viridiplantae') + UNION ALL + SELECT + child.three_letter_abbrev, + child.orthomcl_clade_id, + child.name, + child.core_peripheral, + parent.taxon_group, + child.parent_id + FROM apidb.OrthomclClade child + JOIN TaxonHierarchy parent ON child.parent_id = parent.orthomcl_clade_id ) SELECT three_letter_abbrev, taxon_group, name, core_peripheral FROM TaxonHierarchy - WHERE core_peripheral IN ('C','P') - ) t + WHERE core_peripheral IN ('C', 'P') + ) t WHERE t.three_letter_abbrev = o.orthomcl_abbrev - ) 
taxon - ON taxon.orthomcl_taxon_id = aas.taxon_id - - JOIN ( + ) taxon, + + ( SELECT aas.aa_sequence_id, - CASE - WHEN ores.resource_name IN ( - 'AmoebaDB','CryptoDB','FungiDB','GiardiaDB','HostDB', - 'MicrosporidiaDB','PlasmoDB','PiroplasmaDB','ToxoDB', - 'TrichDB','TriTrypDB','VectorBase' - ) - THEN SUBSTR(ores.resource_url,0,strpos(ores.resource_url,'/downloads')) - || 'record/gene/' || aas.source_id - - WHEN ores.resource_name = 'Uniprot' - THEN SUBSTR(ores.resource_url,0,strpos(ores.resource_url,'/proteomes')) - || 'uniprot/' || aas.source_id - ELSE '' - END AS source_url, - - CASE - WHEN ores.resource_name IS NULL THEN '' - ELSE aas.source_id || ' (' || ores.resource_name || ')' - END AS source_text - - FROM dots.AASequence aas, + CASE + WHEN ores.resource_name IN ('AmoebaDB','CryptoDB','FungiDB','GiardiaDB','HostDB','MicrosporidiaDB', + 'PlasmoDB','PiroplasmaDB','ToxoDB','TrichDB','TriTrypDB','VectorBase') + THEN SUBSTR(ores.resource_url, 0, strpos(ores.resource_url, '/downloads')) || 'record/gene/' + || aas.source_id + WHEN ores.resource_name = 'Uniprot' + THEN SUBSTR(ores.resource_url, 0, strpos(ores.resource_url, '/proteomes') ) || 'uniprot/' + || aas.source_id + ELSE '' END AS source_url, + CASE WHEN ores.resource_name IS NULL THEN '' + ELSE aas.source_id || ' (' || ores.resource_name || ')' END AS source_text + FROM dots.AaSequence aas, apidb.organism ot, apidb.orthomclresource ores WHERE ot.taxon_id = ores.orthomcl_taxon_id - AND ot.taxon_id = aas.taxon_id - ) urls - ON aas.aa_sequence_id = urls.aa_sequence_id - - WHERE taxon.orthomcl_taxon_id = aas.taxon_id - AND aas.taxon_id IN ( - SELECT DISTINCT eas.taxon_id - FROM apidb.organism og, - dots.AASequence eas - WHERE eas.taxon_id = og.taxon_id - ) + AND ot.taxon_id = aas.taxon_id) urls + WHERE aas.aa_sequence_id = ogseq.aa_sequence_id + AND ogseq.group_id = o.group_id + AND aas.aa_sequence_id = urls.aa_sequence_id + AND taxon.orthomcl_taxon_id = aas.taxon_id + AND aas.taxon_id in (select 
distinct(eas.taxon_id) from apidb.organism og, dots.aasequence eas where eas.taxon_id = og.taxon_id) ]]> @@ -334,6 +310,63 @@ ORDER BY sa.full_id, da.start_min
+ + + + + + + + + + + + + + + + From 40a86df9c427fae74eca13baa8dc4e05ac04d72f Mon Sep 17 00:00:00 2001 From: steve-fischer-200 Date: Thu, 19 Feb 2026 14:17:31 -0500 Subject: [PATCH 6/7] adjust more tuning tables --- .../tuningManager/orthomclTuningManager.xml | 47 ++++++++++++++----- 1 file changed, 35 insertions(+), 12 deletions(-) diff --git a/Model/lib/xml/tuningManager/orthomclTuningManager.xml b/Model/lib/xml/tuningManager/orthomclTuningManager.xml index 125bec61..94262fb4 100644 --- a/Model/lib/xml/tuningManager/orthomclTuningManager.xml +++ b/Model/lib/xml/tuningManager/orthomclTuningManager.xml @@ -11,15 +11,18 @@ @@ -75,6 +89,7 @@ LEFT JOIN ( + @@ -110,7 +125,7 @@ LEFT JOIN ( SELECT aa_sequence_id, string_agg(accession, ', ') AS pfam_domains - FROM apidbTuning.DomainAssignment + FROM DomainAssignment GROUP BY aa_sequence_id ) da_agg ON aas.aa_sequence_id = da_agg.aa_sequence_id, apidb.orthologGroup o, @@ -305,7 +320,7 @@ ORDER BY sa.full_id, da.start_min @@ -423,21 +438,29 @@ CREATE INDEX TypeAheadCounts_idx&1 ON TypeAheadCounts&1 (option_id) - + + + From ee7b16cfbea3747302cdff1294a18ddf8a92e79e Mon Sep 17 00:00:00 2001 From: rdemko2332 Date: Thu, 19 Feb 2026 15:29:32 -0500 Subject: [PATCH 7/7] Adding new product description functionality to more efficient sequence attributes query --- .../tuningManager/orthomclTuningManager.xml | 248 +++++++++--------- 1 file changed, 130 insertions(+), 118 deletions(-) diff --git a/Model/lib/xml/tuningManager/orthomclTuningManager.xml b/Model/lib/xml/tuningManager/orthomclTuningManager.xml index 3e8ee1ef..2915b9e7 100644 --- a/Model/lib/xml/tuningManager/orthomclTuningManager.xml +++ b/Model/lib/xml/tuningManager/orthomclTuningManager.xml @@ -94,125 +94,137 @@ LEFT JOIN (