From 5255adafda1ae1cca4dccc586b9d45349b4188a3 Mon Sep 17 00:00:00 2001 From: l-singh-biomsu Date: Thu, 17 Oct 2024 10:18:36 +0000 Subject: [PATCH] udated classification.json --- CURATED_SET/classification.json | 4988 ++++++++++++++++++++----------- 1 file changed, 3292 insertions(+), 1696 deletions(-) diff --git a/CURATED_SET/classification.json b/CURATED_SET/classification.json index a4a9272..05eb72a 100644 --- a/CURATED_SET/classification.json +++ b/CURATED_SET/classification.json @@ -1,11 +1,30 @@ { "tree": { + "Archaeal": "null", + "H1": { + "cH1": "null", + "generic_H1": "null", + "H1.0": "null", + "H1.1": "null", + "H1.10": "null", + "H1.2": "null", + "H1.3": "null", + "H1.4": "null", + "H1.5": "null", + "OO_H1.8": "null", + "scH1": "null", + "TS_H1.6": "null", + "TS_H1.7": "null", + "TS_H1.9": "null" + }, "H2A": { "cH2A": { "cH2A_(Animals)": { "cH2A_(Vertebrata)": { "cH2A_(Mammalia)": { "cH2A_(Homo_sapiens)": { + "cH2A.10_(Homo_sapiens)": "null", + "cH2A.11_(Homo_sapiens)": "null", "cH2A.1_(Homo_sapiens)": "null", "cH2A.2_(Homo_sapiens)": "null", "cH2A.3_(Homo_sapiens)": "null", @@ -14,9 +33,7 @@ "cH2A.6_(Homo_sapiens)": "null", "cH2A.7_(Homo_sapiens)": "null", "cH2A.8_(Homo_sapiens)": "null", - "cH2A.9_(Homo_sapiens)": "null", - "cH2A.10_(Homo_sapiens)": "null", - "cH2A.11_(Homo_sapiens)": "null" + "cH2A.9_(Homo_sapiens)": "null" }, "cH2A_(Mus_musculus)": { "cH2A.1_(Mus_musculus)": "null" @@ -24,13 +41,33 @@ } } }, + "cH2A_(Fungi)": "null", "cH2A_(Plants)": { - "cH2A_(Embryophyta)": "null", - "cH2A_(Chlorophyta)": "null" + "cH2A_(Chlorophyta)": "null", + "cH2A_(Embryophyta)": "null" }, - "cH2A_(Fungi)": "null", "cH2A_(Protists)": "null" }, + "gH2A": "null", + "H2A.J": { + "H2A.J_(Homo_sapiens)": "null" + }, + "H2A.M": "null", + "H2A.R": "null", + "H2A.W": "null", + "H2A.X": { + "H2A.X_(Animals)": { + "H2A.X_(Vertebrata)": { + "H2A.X_(Mammalia)": { + "H2A.X_(Homo_sapiens)": "null", + "H2A.X_(Mus_musculus)": "null" + } + } + }, + "H2A.X_(Fungi)": "null", + 
"H2A.X_(Plants)": "null", + "H2A.X_(Protists)": "null" + }, "H2A.Z": { "H2A.Z.1_(Chordata)": { "H2A.Z.1_(Primates)": { @@ -48,19 +85,6 @@ } } }, - "H2A.X": { - "H2A.X_(Animals)": { - "H2A.X_(Vertebrata)": { - "H2A.X_(Mammalia)": { - "H2A.X_(Homo_sapiens)": "null", - "H2A.X_(Mus_musculus)": "null" - } - } - }, - "H2A.X_(Plants)": "null", - "H2A.X_(Fungi)": "null", - "H2A.X_(Protists)": "null" - }, "macroH2A": { "macroH2A.1_(Mammalia)": { "macroH2A.1.s1_(Mammalia)": { @@ -102,14 +126,7 @@ "H2A.P_(Mus_musculus)": "null" }, "H2A.Q": "null" - }, - "H2A.R": "null", - "H2A.J": { - "H2A.J_(Homo_sapiens)": "null" - }, - "H2A.W": "null", - "H2A.M": "null", - "gH2A": "null" + } }, "H2B": { "cH2B": { @@ -117,6 +134,12 @@ "cH2B_(Vertebrata)": { "cH2B_(Mammalia)": { "cH2B_(Homo_sapiens)": { + "cH2B.10_(Homo_sapiens)": "null", + "cH2B.11_(Homo_sapiens)": "null", + "cH2B.12_(Homo_sapiens)": "null", + "cH2B.13_(Homo_sapiens)": "null", + "cH2B.14_(Homo_sapiens)": "null", + "cH2B.15_(Homo_sapiens)": "null", "cH2B.1_(Homo_sapiens)": "null", "cH2B.2_(Homo_sapiens)": "null", "cH2B.3_(Homo_sapiens)": "null", @@ -125,12 +148,7 @@ "cH2B.6_(Homo_sapiens)": "null", "cH2B.7_(Homo_sapiens)": "null", "cH2B.8_(Homo_sapiens)": "null", - "cH2B.9_(Homo_sapiens)": "null", - "cH2B.10_(Homo_sapiens)": "null", - "cH2B.11_(Homo_sapiens)": "null", - "cH2B.12_(Homo_sapiens)": "null", - "cH2B.13_(Homo_sapiens)": "null", - "cH2B.14_(Homo_sapiens)": "null" + "cH2B.9_(Homo_sapiens)": "null" }, "cH2B_(Mus_musculus)": { "cH2B.1_(Mus_musculus)": "null", @@ -139,37 +157,40 @@ } } }, + "cH2B_(Fungi)": "null", "cH2B_(Plants)": { - "cH2B_(Embryophyta)": "null", - "cH2B_(Chlorophyta)": "null" + "cH2B_(Chlorophyta)": "null", + "cH2B_(Embryophyta)": "null" }, - "cH2B_(Fungi)": "null", "cH2B_(Protists)": "null" }, - "H2B.L": "null", - "H2B.W": { - "H2B.W_(Homo_sapiens)": { - "H2B.W.1_(Homo_sapiens)": "null", - "H2B.W.2_(Homo_sapiens)": "null" - } - }, + "CS_H2B_(Echinoidea)": "null", + "early_H2B_(Echinoidea)": "null", 
+ "gH2B": "null", "H2B.K": { "H2B.K_(Homo_sapiens)": "null" }, + "H2B.L": "null", "H2B.N": { "H2B.N_(Homo_sapiens)": "null" }, "H2B.O": "null", "H2B.S": "null", - "gH2B": "null", - "H2B.Z": "null", "H2B.V": "null", - "CS_H2B_(Echinoidea)": "null", - "early_H2B_(Echinoidea)": "null", + "H2B.W": { + "H2B.W_(Homo_sapiens)": { + "H2B.W.1_(Homo_sapiens)": "null", + "H2B.W.2_(Homo_sapiens)": "null" + } + }, + "H2B.Z": "null", "late_H2B_(Echinoidea)": "null", "sperm_H2B_(Echinoidea)": "null" }, "H3": { + "cenH3_(Eukarya)": { + "cenH3_(Plants)": "null" + }, "cH3": { "cH3_(Animals)": { "cH3_(Vertebrata)": { @@ -183,24 +204,24 @@ } } }, + "cH3_(Fungi)": "null", "cH3_(Plants)": { - "cH3_(Embryophyta)": "null", - "cH3_(Chlorophyta)": "null" + "cH3_(Chlorophyta)": "null", + "cH3_(Embryophyta)": "null" }, - "cH3_(Fungi)": "null", "cH3_(Protists)": "null" }, + "H3.1-like_(Plants)": "null", "H3.3": { "H3.3_(Animals)": { "H3.3_(Homo_sapiens)": "null" }, - "H3.3_(Plants)": "null", "H3.3_(Fungi)": { "H3.3_(Ascomycota)": "null" }, + "H3.3_(Plants)": "null", "H3.3_(Protists)": "null" }, - "H3.4_(Mammalia)": "null", "H3.3-like?": { "H3.3-like_(Animals)": { "H3.X_(Primates?)": { @@ -211,64 +232,57 @@ } }, "H3.3-like_(Plants)": { - "TS H3.10": "null", - "H3_(Lilly???)": "null" + "H3_(Lilly???)": "null", + "TS H3.10": "null" } }, - "H3.1-like_(Plants)": "null", + "H3.4_(Mammalia)": "null", "H3.5_(Primates_or_Hominids?)": "null", "H3.6_(Mammals?)?": "null", "H3.7_(Mammals?)?": "null", "H3.8_(Mammals?)?": "null", - "H3.P_(Moneuplotes?)": "null", - "H3.V_(Trypanosomes?)": "null", "H3.B_(Giardia?)": "null", - "cenH3_(Eukarya)": "null" + "H3.P_(Moneuplotes?)": "null", + "H3.V_(Trypanosomes?)": "null" }, "H4": { "cH4": "null" }, - "H1": { - "cH1": "null", - "generic_H1": "null", - "H1.0": "null", - "H1.1": "null", - "H1.2": "null", - "H1.3": "null", - "H1.4": "null", - "H1.5": "null", - "TS_H1.6": "null", - "TS_H1.7": "null", - "OO_H1.8": "null", - "TS_H1.9": "null", - "H1.10": "null", - "scH1": 
"null" - }, - "Archaeal": "null", "Viral": "null" }, "info": { - "H2A": { + "Archaeal": { "level": "type", "description": { - "summary": "H2A is one of the core histone types present in all Eukaryotes. H2A forms dimers with H2B via the \"hand shake\" motif. Two H2A-H2B dimers in turn associate with H3-H4 tetramer to form complete nucleosome core. Structure of H2A consists of a histone fold domain extended by a short \u03b1C-helix and has both N- and C-terminal tails. \u03b1C-helix and C-terminal tail form \"docking domain\" that locks the H2A-H2B dimer onto the surface of H3-H4 tetramer [luger_crystal_1997]. It has been suggested that H2A and H2B have arisen from H3 and H4 during evolution [malik_phylogenomics_2003]. H2A histones have the most number of described functional variants." + "summary": "null", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Eukaryotes", - "taxonomic_span_id": "2759", - "publications": [ - "luger_crystal_1997", - "malik_phylogenomics_2003" - ] + "taxonomic_span": "null", + "taxonomic_span_id": "null", + "alternate_names": [], + "publications": [] }, - "cH2A": { + "cenH3_(Eukarya)": { "level": "variant_group", "description": { - "summary": "cH2A -- canonical H2A histones. This is a loosely defined group that encompasses major H2A histone proteins that are mainly expressed during S-phase of the cell cycle in eukaryotes and are highly conserved even between distantly related species. Such proteins are often called replication dependent (RD), replication coupled (RC), clustered or \"bulk\" histones [marzluff_metabolism_2008,talbert_histone_2021]. 
They are likely similar to the original H2A histones of the last common ancestor of eukaryotes [malik_phylogenomics_2003], although a similar H2A.X variant might have been also ancestral [talbert_histone_2021]. Expression of canonical histones during S-phase is often tightly regulated, but mechanisms may differ among kindoms [marzluff_birth_2017,pontarotti_long-term_2009]. Canonical histone genes are often present as large mulrigene families clustered together in certain locations of the genome. However, there are known limitations to the definition given above. Functional diversification of paralogous genes is a common process in evolution -- in many species multiple copies of canonical histone genes have undergone diversification in terms of sequence variation, cell-cycle or tissue-specific expression patterns. Sometimes this diversification is very subtle and species-specific (e.g. cH2A isoforms in human), in other cases there may be a spectrum of canonical-like proteins (e.g. plant canonical H2As which show higher sequence diversity than cH2Bs of animals). Hence, whether a particular gene should be regarded as a canonical, a bona fide variant or a canonical subvariant/isoform may be a matter of debate and definition in each particular case. Within the current hierarchical classification system, additional information about the cH2A class may be gained by looking at the description of its subclasses. 
", - "taxonomy": "Present in all Eukaryotes.", + "summary": "null", + "taxonomy": "null", "genes": "null", - "evolution": "Because of its conserved function in the DNA damage response, it seems probable that H2A.X is ancestral, and that the various RC H2As are derived from it [talbert_histone_2021].", + "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -276,32 +290,74 @@ "structure": "null", "interactions": "null", "disease": "null", - "caveats": "In certain species H2A.X may perform cH2A role, hence in our classification such species will lack cH2A histones. In single-celled eukaryotes, such as yeast, H2A.X can be the primary form of H2A [talbert_histone_2021]. The same might apply to certain protozoan parasites, such as G. lamblia [dalmasso_canonical_2011]." + "caveats": "null" }, - "taxonomic_span": "Eukaryota", + "taxonomic_span": "null", + "taxonomic_span_id": "null", + "alternate_names": [], + "publications": [] + }, + "cenH3_(Plants)": { + "level": "variant", + "description": { + "summary": "cenH3 is a centromere-specific histone variant, which replaces canonical H3 in centromeric nucleosomes. It is required for kinetochore formation, mitotic progression and chromosome segregation. cenH3 has an extended L1-loop and its N-terminal tail is very different from other H3 variants. cenH3s have an extended L1-loop and usually replace Phe84 in canonical H3 with Trp, and Thr 107 with Ala, Cys, or Ser. cenH3s ususally lack a conserved glutamine in the alpha1 helix of the histone fold. 
cenH3s typically have only about 50-60% amino acid identity to canonical H3 in the histone fold domain and no conservation of the N-terminus.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Eukaryotes", "taxonomic_span_id": "2759", "alternate_names": [ { - "name": "canonical H2A" + "name": "CENP-A" + }, + { + "name": "Cse4" + }, + { + "name": "HCP-3" + }, + { + "name": "CNP1" + }, + { + "name": "HTR12" + }, + { + "name": "CNA1" + }, + { + "name": "cid" } ], "publications": [ - "marzluff_metabolism_2008", - "talbert_histone_2021", - "malik_phylogenomics_2003", - "marzluff_birth_2017", - "pontarotti_long-term_2009" + "14583738", + "19766562", + "21743476", + "22650316", + "23324462", + "25956076" ] }, - "cH2A_(Animals)": { + "cH1": { "level": "variant_group", "description": { - "summary": "cH2A_(Animals) -- clustered H2A histones in animals (Metazoa), often called canonical, replication-dependent, replication-coupled or \"bulk\" H2A histones are a major class of H2A histones in animals with high sequence similarity across all animal species. Histone genes encodig these proteins have several particular features. 1) These genes lack introns and are found in multiple similar copies clustered along the genome togerther with other core histone genes (H3, H4, H2B, and optionally H1). The exact organisation may vary from tandemly repeated quintets of H3, H4, H2A, H2B, H1 genes transcribed from the same strand to non-tandem jumbled arrays of genes transcribed from divergent promoters [pontarotti_long-term_2009]. 
2) These genes are mainly expressed during S-phase of the cell cycle in a coordinated fashion (hence the name \"replication dendent\") and produce mRNAs that are not polyadenylated but rather end in a conserved stem-loop, which is further bound by the stem-loop binding protein (SLBP). mRNAs are rapidly degraded after the S-phase. 3) These genes are present in a specialized nuclear domain, the histone locus body (HLB), which concetrates factors for histone mRNA transcription and processing (in humans these include NPAT, U7 snRNP, FLASH) [marzluff_birth_2017].", - "taxonomy": "Animals (Metazoa)", + "summary": "null", + "taxonomy": "null", "genes": "null", - "evolution": "H2A.X histone variant is usually closely related to replication-dependent H2A histones in the same group of animals. In humans, H2A.X produces both polyadenylated mRNAs and mRNAs ending in a stem-loop. It is probale that it is ancestral to clustered H2A histones [talbert_histone_2021].", + "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -309,25 +365,22 @@ "structure": "null", "interactions": "null", "disease": "null", - "caveats": "1) Clustered histones may still exhibit some level of sequence variation between the multiple gene copies in certain species. Evidence exists that these differences may have functional implications (e.g. affect nucleosome stability). Some clustered genes have tissue-specific expression and play specific functional roles (e.g. cH2A.1 in mice). 2) A subset of clustered histones, which are normally expressed as replication-dependent histones, are expressed as polyadenylated mRNAs in adult non-dividing tissues to replenish histone pool in differentiated tissues [lyons_subset_2016]. 3) Certain clustered histones may act as functional histone variants with replication-independent polyA-tail-regulated expression being the major/only form (e.g. 
cH2B.E_(Mus_musculus), or H2A.J, which is closely related to cH2As). 4) In C. elegans an alternative mechanism of mRNA 3'-end processing evolved resulting in loss of HLB and histone clusters [marzluff_birth_2017, pontarotti_long-term_2009]. 5) H2A.X histone variant is usually closely related to replication-dependent H2A histones in the same group of animals. In humans, H2A.X produces both polyadenylated mRNAs and mRNAs ending in a stem-loop. It is probale that it is ancestral to clustered H2A histones [talbert_histone_2021]. " + "caveats": "null" }, - "taxonomic_span": "Metazoa", - "taxonomic_span_id": "33208", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], - "publications": [ - "pontarotti_long-term_2009", - "marzluff_birth_2017" - ] + "publications": [] }, - "cH2A_(Vertebrata)": { + "cH2A": { "level": "variant_group", "description": { - "summary": "cH2A_(Vertebrata) -- clustered H2A histones in vertebrates, often called canonical, replication-dependent, replication-coupled or \"bulk\" H2A histones. This is a subclass of cH2A_(Animals) (see it for a detailed description).", - "taxonomy": "Vertebrates (Vertebrata)", + "summary": "cH2A: canonical H2A histones. This is a loosely defined group that encompasses major H2A histone proteins that are mainly expressed during S-phase of the cell cycle in eukaryotes and are highly conserved even between distantly related species. Such proteins are often called replication dependent (RD), replication coupled (RC), clustered or \"bulk\" histones [marzluff_metabolism_2008,talbert_histone_2021]. They are likely similar to the original H2A histones of the last common ancestor of eukaryotes [malik_phylogenomics_2003], although a similar H2A.X variant might have been also ancestral [talbert_histone_2021]. Expression of canonical histones during S-phase is often tightly regulated, but mechanisms may differ among kingdoms [marzluff_birth_2017,pontarotti_long-term_2009]. 
Canonical histone genes are often present as large multigene families clustered together in certain locations of the genome. However, there are known limitations to the definition given above. Functional diversification of paralogous genes is a common process in evolution: in many species multiple copies of canonical histone genes have undergone diversification in terms of sequence variation, cell-cycle or tissue-specific expression patterns. Sometimes this diversification is very subtle and species-specific (e.g. cH2A isoforms in human), in other cases there may be a spectrum of canonical-like proteins (e.g. plant canonical H2As which show higher sequence diversity than cH2Bs of animals). Hence, whether a particular gene should be regarded as a canonical, a bona fide variant or a canonical subvariant/isoform may be a matter of debate and definition in each particular case. Within the current hierarchical classification system, additional information about the cH2A class may be gained by looking at the description of its subclasses. ", + "taxonomy": "Present in all Eukaryotes.", "genes": "null", - "evolution": "null", + "evolution": "Because of its conserved function in the DNA damage response, it seems probable that H2A.X is ancestral, and that the various RC H2As are derived from it [talbert_histone_2021].", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -335,22 +388,32 @@ "structure": "null", "interactions": "null", "disease": "null", - "caveats": "null" + "caveats": "In certain species H2A.X may perform the cH2A role, hence in our classification such species will lack cH2A histones. In single-celled eukaryotes, such as yeast, H2A.X can be the primary form of H2A [talbert_histone_2021]. The same might apply to certain protozoan parasites, such as G. lamblia [dalmasso_canonical_2011]." 
}, - "taxonomic_span": "Vertebrata", - "taxonomic_span_id": "7742", - "alternate_names": [], - "publications": [] + "taxonomic_span": "Eukaryota", + "taxonomic_span_id": "2759", + "alternate_names": [ + { + "name": "canonical H2A" + } + ], + "publications": [ + "malik_phylogenomics_2003", + "marzluff_birth_2017", + "marzluff_metabolism_2008", + "pontarotti_long-term_2009", + "talbert_histone_2021" + ] }, - "cH2A_(Mammalia)": { - "level": "variant_group", + "cH2A.10_(Homo_sapiens)": { + "level": "variant", "description": { - "summary": "cH2A_(Mammalia) -- clustered H2A histones in mammals, often called canonical, replication-dependent, replication-coupled or \"bulk\" H2A histones. This is a subclass of cH2A_(Vertebrata) and cH2A_(Animals) (see it for a detailed description).", - "taxonomy": "Vertebrates (Vertebrata)", + "summary": "cH2A.10_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2A histones in human encoded by the H2AC21 gene.", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -360,19 +423,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Mammalia", - "taxonomic_span_id": "40674", + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", "alternate_names": [], "publications": [] }, - "cH2A_(Homo_sapiens)": { - "level": "variant_group", + "cH2A.11_(Homo_sapiens)": { + "level": "variant", "description": { - "summary": "cH2A_(Homo_sapiens) -- clustered H2A histones in human, often called canonical, replication-dependent, replication-coupled or \"bulk\" H2A histones. For a general description see cH2A_(Animals) class. Replication-dependent histones in humans are found in four loci: a large cluster on chromosome 6 (more than 60 genes), two clusters on chromosome 1 (10-12 genes and 4 genes) and a single H4 gene on chromosome 12 (with a neighbouring H2AJ gene). 
Humans have 18 H2A genes that code for replication-dependent H2A histones. The cluster on chromosome 6 encodes 13 H2A genes (H2AC1, H2AC4, H2AC6, H2AC7, H2AC8, H2AC11, H2AC12, H2AC13, H2AC14, H2AC15, H2AC16, H2AC17) and several pseudogenes. The first cluster on chromosome 1 encodes 4 genes (H2AC18, H2AC19, H2AC20, H2AC21), and the second cluster on chromosome 1 endodes one gene (H2AC25). 18 genes enconde 11 protein variants. H2A18, H2AC19, H2AC20, H2AC21 encode isoforms that have a methionine instead of leucine at position 51 conferring a mobility shift in triton-acid urea gel electrophoresis (historically, H2A.2 symbol was used to mark this difference) [franklin_non-allelic_1977]. H2AC1 gene (formely, called HIST1H2AA, TH2A) is the most divergent gene of the family, together with H2BC1 they share a common promoter and maifest tissue-specific expression (at least in testis and oocytes) [huynh_two_2016].", + "summary": "cH2A.11_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2A histones in human endoded by H2AC25 gene.", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -380,24 +444,22 @@ "structure": "null", "interactions": "null", "disease": "null", - "caveats": "1) A subset of clustered histones, which are normally expressed as replication-dependent histones, are expressed as polyadenylated mRNAs in adult non-dividing tissues to replenish histone pool in differentiated tissues [lyons_subset_2016]. 2) H2A.X histone variant is usually closely related to replication-dependent H2A histones in the same group of animals. In humans, H2A.X produces both polyadenylated mRNAs and mRNAs ending on a stem-loop. It is probale that it is ancestral to clustered H2A histones [talbert_histone_2021]. 
3) The H2AJ gene on chromosome 12 encoding H2A.J histone variant is sequence wise very similar to other canonical H2As in human. However, it appears to produce only polyadenylated mRNA. See H2A.J variant description for details." + "caveats": "null" }, "taxonomic_span": "Homo sapiens", "taxonomic_span_id": "9606", "alternate_names": [], - "publications": [ - "franklin_non-allelic_1977", - "huynh_two_2016" - ] + "publications": [] }, "cH2A.1_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "cH2A.1_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2A histones in human endoded by H2AC1 gene (formerly, HIST1H2AA, TH2A). This is the most divergent gene of the family, its protein product has differences in several internal positions as well as in the last 6 amino acids at the C-terminus with respect to the majority of clustered H2As. Its length is also one amino acid longer than for the rest of H2As (130 amio acid residues after initiator methionine cleavage). Together with H2BC1 they share a common promoter and manifest tissue-specific expression (at least in testis and oocytes) (see human protein atlas). H2AC1 and H2BC1 are thought to be maternal effect factors and their expression was shown to enhance OSKM-induced cell reprogramming in human cells [huynh_two_2016]. See also description of cH2A.1_(Mus_musculus) -- a related histone variant encoded by H2ac1 gene which has been characterized through a number of in vivo and in vitro studies.", + "summary": "cH2A.1_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2A histones in human endoded by H2AC1 gene (formerly, HIST1H2AA, TH2A). This is the most divergent gene of the family, its protein product has differences in several internal positions as well as in the last 6 amino acids at the C-terminus with respect to the majority of clustered H2As. 
Its length is also one amino acid longer than for the rest of H2As (130 amino acid residues after initiator methionine cleavage). Together with H2BC1 they share a common promoter and manifest tissue-specific expression (at least in testis and oocytes) (see human protein atlas). H2AC1 and H2BC1 are thought to be maternal effect factors and their expression was shown to enhance OSKM-induced cell reprogramming in human cells [huynh_two_2016]. See also the description of cH2A.1_(Mus_musculus), a related histone variant encoded by the H2ac1 gene, which has been characterized through a number of in vivo and in vitro studies.", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -421,10 +483,57 @@ "huynh_two_2016" ] }, + "cH2A.1_(Mus_musculus)": { + "level": "variant", + "description": { + "summary": "cH2A.1_(Mus_musculus) is an isoform (variant) of clustered (canonical) H2A histones in mouse encoded by the H2ac1 gene (formerly, Hist1h2aa, Th2a). This is the most divergent gene of the family; its protein product has differences in the ?last 6 amino acids? at the C-terminus with respect to the majority of clustered H2As???. Together with the H2bc1 gene they share a common promoter and manifest tissue-specific expression (at least in testis, oocytes and zygotes) [padavattan_structural_2015]. Disruption of Th2a and Th2b genes causes defects in spermatogenesis [shinagawa_disruption_2015]. H2ac1 and H2bc1 contribute to activation of the paternal genome after fertilization [shinagawa_histone_2014]. These variants facilitate OSKM-induced cell reprogramming [shinagawa_histone_2014]. The X-ray structure of a nucleosome harboring this variant has fewer histone-DNA contacts and perturbed L1-L1-loop interactions. Mutational in vivo analysis suggests histone tails and L1 loop are important for reprogramming [padavattan_structural_2015]. 
Differential scanning calorimetry analysis indicated that the H2ac1/H2bc1 complex was more stable than other combinations of canonical histones [shinagawa_histone_2014]. This variant is related to cH2A.1_(Homo_sapiens) encoded by the H2AC1 gene and is located at the same position in the largest histone gene cluster; however, their sequences differ at 18 positions. Note: Since this variant manifests similar features in mice and humans (tissue-specific expression, synteny, divergent sequence with respect to other canonical variants in each species), similar variants likely exist in all supraprimates or in higher taxa. If and when sufficient evidence accumulates, such variants may be grouped into a separate class.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Mus musculus", + "taxonomic_span_id": "10090", + "alternate_names": [ + { + "name": "Th2a" + }, + { + "name": "TS H2A.1" + } + ], + "publications": [ + "padavattan_structural_2015", + "shinagawa_disruption_2015", + "shinagawa_histone_2014" + ] + }, "cH2A.2_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "cH2A.2_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2A histones in human endoded by H2AC4, H2AC8 genes." 
+ "summary": "cH2A.2_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2A histones in human encoded by the H2AC4 and H2AC8 genes.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, "taxonomic_span": "Homo sapiens", "taxonomic_span_id": "9606", @@ -434,7 +543,20 @@ "cH2A.3_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "cH2A.3_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2A histones in human endoded by H2AC6 gene." + "summary": "cH2A.3_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2A histones in human encoded by the H2AC6 gene.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, "taxonomic_span": "Homo sapiens", "taxonomic_span_id": "9606", @@ -444,7 +566,20 @@ "cH2A.4_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "cH2A.4_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2A histones in human endoded by H2AC7 gene." 
+ "summary": "cH2A.4_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2A histones in human encoded by the H2AC7 gene.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, "taxonomic_span": "Homo sapiens", "taxonomic_span_id": "9606", @@ -454,7 +589,20 @@ "cH2A.5_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "cH2A.5_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2A histones in human endoded by H2AC11, H2AC13, H2AC15, H2AC16, H2AC17 genes. This is an isoform represented by the most number of genes." + "summary": "cH2A.5_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2A histones in human encoded by the H2AC11, H2AC13, H2AC15, H2AC16 and H2AC17 genes. This isoform is represented by the largest number of genes.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, "taxonomic_span": "Homo sapiens", "taxonomic_span_id": "9606", @@ -464,7 +612,20 @@ "cH2A.6_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "cH2A.6_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2A histones in human endoded by H2AC12 gene." 
+ "summary": "cH2A.6_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2A histones in human encoded by the H2AC12 gene.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, "taxonomic_span": "Homo sapiens", "taxonomic_span_id": "9606", @@ -474,7 +635,20 @@ "cH2A.7_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "cH2A.7_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2A histones in human endoded by H2AC14 gene." + "summary": "cH2A.7_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2A histones in human encoded by the H2AC14 gene.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, "taxonomic_span": "Homo sapiens", "taxonomic_span_id": "9606", @@ -484,7 +658,20 @@ "cH2A.8_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "cH2A.8_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2A histones in human. It is the product of H2AC18 and H2AC19 genes. Together with cH2A.9_(Homo_sapiens) isoform (product of H2AC20 gene) this isoform has a methionine instead of leucine at position 51 relative to other cH2As in human (H2AL51M substitution). Historically the methionine containing isoforms were classified as H2A.2 histones, based on mobility differences in triton-acid urea gel electrophoresis[franklin_non-allelic_1977]." + "summary": "cH2A.8_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2A histones in human. It is the product of H2AC18 and H2AC19 genes. 
Together with cH2A.9_(Homo_sapiens) isoform (product of H2AC20 gene) this isoform has a methionine instead of leucine at position 51 relative to other cH2As in human (H2AL51M substitution). Historically the methionine containing isoforms were classified as H2A.2 histones, based on mobility differences in triton-acid urea gel electrophoresis[franklin_non-allelic_1977].", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, "taxonomic_span": "Eukaryotes", "taxonomic_span_id": "2759", @@ -496,7 +683,20 @@ "cH2A.9_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "cH2A.9_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2A histones in human. It is the product of H2AC20 gene. Together with cH2A.8_(Homo_sapiens) isoform (product of H2AC18 and H2AC19 genes) this isoform has a methionine instead of leucine at position 51 relative to other cH2As in human (H2AL51M substitution). Historically the methionine containing isoforms were classified as H2A.2 histones, based on mobility differences in triton-acid urea gel electrophoresis[franklin_non-allelic_1977]." + "summary": "cH2A.9_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2A histones in human. It is the product of H2AC20 gene. Together with cH2A.8_(Homo_sapiens) isoform (product of H2AC18 and H2AC19 genes) this isoform has a methionine instead of leucine at position 51 relative to other cH2As in human (H2AL51M substitution). 
Historically the methionine containing isoforms were classified as H2A.2 histones, based on mobility differences in triton-acid urea gel electrophoresis[franklin_non-allelic_1977].", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, "taxonomic_span": "Eukaryotes", "taxonomic_span_id": "2759", @@ -505,34 +705,15 @@ "franklin_non-allelic_1977" ] }, - "cH2A.10_(Homo_sapiens)": { - "level": "variant", - "description": { - "summary": "cH2A.10_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2A histones in human endoded by H2AC21 gene." - }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", - "alternate_names": [], - "publications": [] - }, - "cH2A.11_(Homo_sapiens)": { + "cH2A_(Animals)": { "level": "variant", "description": { - "summary": "cH2A.11_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2A histones in human endoded by H2AC25 gene." - }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", - "alternate_names": [], - "publications": [] - }, - "cH2A_(Mus_musculus)": { - "level": "variant_group", - "description": { - "summary": "cH2A_(Mus_musculus) -- clustered H2A histones in mouse, often called canonical, replication-dependent, replication-coupled or \"bulk\" H2A histones. repliation-dependent histones in mouse similar to human are found in several clusters. The largest cluster is found on chromosome 13 (more than 50 geens) and smaller clusters on chromosomes 3 and 11 [marzluff_human_2002]. 
There are 18 replication-dependent H2A genes currently annotated in mouse genome: 13 in cluster on chromosome 13, 4 in cluster on chromosome 3 and 1 on chromosome 11.", + "summary": "cH2A_(Animals) clustered H2A histones in animals (Metazoa), often called canonical, replication-dependent, replication-coupled or \"bulk\" H2A histones are a major class of H2A histones in animals with high sequence similarity across all animal species. Histone genes encoding these proteins have several particular features. 1) These genes lack introns and are found in multiple similar copies clustered along the genome together with other core histone genes (H3, H4, H2B, and optionally H1). The exact organisation may vary from tandemly repeated quintets of H3, H4, H2A, H2B, H1 genes transcribed from the same strand to non-tandem jumbled arrays of genes transcribed from divergent promoters [pontarotti_long-term_2009]. 2) These genes are mainly expressed during S-phase of the cell cycle in a coordinated fashion (hence the name \"replication-dependent\") and produce mRNAs that are not polyadenylated but rather end in a conserved stem-loop, which is further bound by the stem-loop binding protein (SLBP). mRNAs are rapidly degraded after the S-phase. 3) These genes are present in a specialized nuclear domain, the histone locus body (HLB), which concentrates factors for histone mRNA transcription and processing (in humans these include NPAT, U7 snRNP, FLASH) [marzluff_birth_2017].", + "taxonomy": "Animals (Metazoa)", "genes": "null", - "evolution": "null", + "evolution": "H2A.X histone variant is usually closely related to replication-dependent H2A histones in the same group of animals. In humans, H2A.X produces both polyadenylated mRNAs and mRNAs ending in a stem-loop.
It is probable that it is ancestral to clustered H2A histones [talbert_histone_2021].", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -540,44 +721,25 @@ "structure": "null", "interactions": "null", "disease": "null", - "caveats": "null" + "caveats": "1) Clustered histones may still exhibit some level of sequence variation between the multiple gene copies in certain species. Evidence exists that these differences may have functional implications (e.g. affect nucleosome stability). Some clustered genes have tissue-specific expression and play specific functional roles (e.g. cH2A.1 in mice). 2) A subset of clustered histones, which are normally expressed as replication-dependent histones, are expressed as polyadenylated mRNAs in adult non-dividing tissues to replenish histone pool in differentiated tissues [lyons_subset_2016]. 3) Certain clustered histones may act as functional histone variants with replication-independent polyA-tail-regulated expression being the major/only form (e.g. cH2B.E_(Mus_musculus), or H2A.J, which is closely related to cH2As). 4) In C. elegans an alternative mechanism of mRNA 3'-end processing evolved resulting in loss of HLB and histone clusters [marzluff_birth_2017, pontarotti_long-term_2009]. 5) H2A.X histone variant is usually closely related to replication-dependent H2A histones in the same group of animals. In humans, H2A.X produces both polyadenylated mRNAs and mRNAs ending in a stem-loop. It is probable that it is ancestral to clustered H2A histones [talbert_histone_2021].
" }, - "taxonomic_span": "Mus musculus", - "taxonomic_span_id": "10090", + "taxonomic_span": "Metazoa", + "taxonomic_span_id": "33208", + "alternate_names": [], "publications": [ - "marzluff_human_2002" + "marzluff_birth_2017", + "pontarotti_long-term_2009" ] }, - "cH2A.1_(Mus_musculus)": { + "cH2A_(Chlorophyta)": { "level": "variant", "description": { - "summary": "cH2A.1_(Mus_musculus) -- is an isoform (variant) of clustered (canonical) H2A histones in mouse endoded by H2ac1 gene (formerly, Hist1h2aa, Th2a). This is the most divergent gene of the family, its protein product has differences in the ?last 6 amino acids? at the C-terminus with respect to the majority of clustered H2As???. Together with H2bc1 gene they share a common promoter and manifest tissue-specific expression (at least in testis, oocytes and zygotes) [padavattan_structural_2015]. Disruption of Th2a and Th2b genes causes defects in spermatogenesis [shinagawa_disruption_2015]. H2ac1 and H2bc1 contribute to activation of the paternal genome after fertilization [shinagawa_histone_2014]. These variant facilitate OSKM-induced cell reprogramming [shinagawa_histone_2014]. X-ray structure of nucleosome harboring this variant have fewer histone-DNA contacts and perturbed L1-L1-loop interactions. Mutational in vivo analysis suggest histone tails and L1 loop are important for reprogramming[padavattan_structural_2015]. Differential scanning calorimetry analysis indicated that the H2ac1/H2bc1 complex was more stable than other combinations of canonical histones [shinagawa_histone_2014]. This variant is related to cH2A.1_(Homo_sapiens) encoded by H2A1C gene, is located in the same position at the largest histone gene cluster, however, their sequence differs at 18 positions. 
Note: Since this variant manifests similar features in mice and humans (tissue-specific expression, synteny, divergent sequence with respect to other canonical variants in each species) likely similar variants exist in all supraprimates or in higher taxa. Once and if sufficient evidence accumulates such variants may be grouped into a separate class." - }, - "taxonomic_span": "Mus musculus", - "taxonomic_span_id": "10090", - "alternate_names": [ - { - "name": "Th2a" - }, - { - "name": "TS H2A.1" - } - ], - "publications": [ - "padavattan_structural_2015", - "shinagawa_disruption_2015", - "shinagawa_histone_2014" - ] - }, - "cH2A_(Plants)": { - "level": "variant_group", - "description": { - "summary": "cH2A_(Plants) -- canonical H2A histones of green plants (Viridiplantae), which include green algae and land plants. This is a loosely defined group of replication-dependent H2A histones in plants together with similar sequences that might have further diversified towards replication-independent tissue-specific expression but have not yet been extensively studied. Currenly not much is known about the functional specialization of various cH2As isoforms in plants [alvarez-venegas_canonical_2019]. Organisation of canonical histones in green plants is variable. In land plants unlike clustered/canonical histones of animals (see cH2A_(Metazoa)) replication dependent histone mRNAs are polyadenilated and genes are interspersed throught the genome, H2A genes may have introns. In chlorophyte green algae, such as Chlamydomonas, genes are grouped in clusteres and mRNAs end in 3'-stem loop similar to those of histone genes in animals [marzluff_metabolism_2008, alvarez-venegas_canonical_2019]", - "taxonomy": "Viridiplantae (Plants)", + "summary": "cH2A_(Chlorophyta) canonical H2A histones of green algae and similar replication-independent histones. 
In chlorophyte green algae, such as Chlamydomonas, genes are grouped in clusters and mRNAs end in 3'-stem loop similar to those of histone genes in animals [marzluff_metabolism_2008, alvarez-venegas_canonical_2019].", + "taxonomy": "Chlorophyta", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -587,24 +749,24 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Viridiplantae", - "taxonomic_span_id": "33090", + "taxonomic_span": "Chlorophyta", + "taxonomic_span_id": "3041", "alternate_names": [], "publications": [ - "alvarez-venegas_canonical_2019", - "marzluff_metabolism_2008", - " alvarez-venegas_canonical_2019" + "alvarez-venegas_canonical_2019", + "jiang_evolution_2020", + "marzluff_metabolism_2008" ] }, "cH2A_(Embryophyta)": { - "level": "variant_group", + "level": "variant", "description": { - "summary": "cH2A_(Embryophyta) -- canonical replication-dependent H2A histones of land plants and similar replication-independent histones. In land plants unlike clustered/canonical histones of animals (see cH2A_(Metazoa)) replication dependent histone mRNAs are polyadenilated and genes are interspersed throught the genome, H2A genes may have introns. [marzluff_metabolism_2008, alvarez-venegas_canonical_2019]", + "summary": "cH2A_(Embryophyta) canonical replication-dependent H2A histones of land plants and similar replication-independent histones. In land plants unlike clustered/canonical histones of animals (see cH2A_(Animals)) replication dependent histone mRNAs are polyadenylated and genes are interspersed throughout the genome, H2A genes may have introns.
[marzluff_metabolism_2008, alvarez-venegas_canonical_2019]", "taxonomy": "Embryophyta", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -618,19 +780,19 @@ "taxonomic_span_id": "3193", "alternate_names": [], "publications": [ - "marzluff_metabolism_2008", - " alvarez-venegas_canonical_2019" + "alvarez-venegas_canonical_2019", + "marzluff_metabolism_2008" ] }, - "cH2A_(Chlorophyta)": { - "level": "variant_group", + "cH2A_(Fungi)": { + "level": "variant", "description": { - "summary": "cH2A_(Chlorophyta) -- canonical H2A histones of green algae and similar replication-independent histones. In chlorophyte green algae, such as Chlamydomonas, genes are grouped in clusteres and mRNAs end in 3'-stem loop similar to those of histone genes in animals [marzluff_metabolism_2008, alvarez-venegas_canonical_2019].", - "taxonomy": "Chlorophyta", + "summary": "cH2A_(Fungi) canonical replication-dependent H2A histones in fungi. In most fungal species H2A.X histone plays the role of the primary H2A histone [nowrousian_5_2014]. In the current classification these histones will be classified as H2A.X, and this group does not include them. Certain parasitic fungi have been reported to lack H2A.X and have H2A histones [dalmasso_canonical_2011].
Note: Since H2A.X are usually closely related to canonical H2As within respective taxanomic groups, an alternative approach might be to assign fungal H2A.X histones simultaneously to both H2A.X and cH2A classes.", + "taxonomy": "Fungi", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -640,24 +802,23 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Chlorophyta", - "taxonomic_span_id": "3041", + "taxonomic_span": "Fungi", + "taxonomic_span_id": "4751", "alternate_names": [], "publications": [ - "marzluff_metabolism_2008", - " alvarez-venegas_canonical_2019", - "jiang_evolution_2020" + "dalmasso_canonical_2011", + "nowrousian_5_2014" ] }, - "cH2A_(Fungi)": { - "level": "variant_group", + "cH2A_(Homo_sapiens)": { + "level": "variant", "description": { - "summary": "cH2A_(Fungi) -- canonical replication-dependent H2A histones in fungi. In most fungal species H2A.X histone plays the role of the primary H2A histone [nowrousian_5_2014]. In the current classification these histones will be classified as H2A.X, and this group does not include them. Certain parasitic fungi have been reported to lack H2A.X and have H2A histones [dalmasso_canonical_2011]. Note: Since H2A.X are usually closely related to canonical H2As within respective taxanomic groups, an alternative approach might be to assign fungal H2A.X histones simultaneously to both H2A.X and cH2A classes.", - "taxonomy": "Fungi", + "summary": "cH2A_(Homo_sapiens) clustered H2A histones in human, often called canonical, replication-dependent, replication-coupled or \"bulk\" H2A histones. For a general description see cH2A_(Animals) class. Replication-dependent histones in humans are found in four loci: a large cluster on chromosome 6 (more than 60 genes), two clusters on chromosome 1 (10-12 genes and 4 genes) and a single H4 gene on chromosome 12 (with a neighbouring H2AJ gene). 
Humans have 18 H2A genes that code for replication-dependent H2A histones. The cluster on chromosome 6 encodes 13 H2A genes (H2AC1, H2AC4, H2AC6, H2AC7, H2AC8, H2AC11, H2AC12, H2AC13, H2AC14, H2AC15, H2AC16, H2AC17) and several pseudogenes. The first cluster on chromosome 1 encodes 4 genes (H2AC18, H2AC19, H2AC20, H2AC21), and the second cluster on chromosome 1 encodes one gene (H2AC25). 18 genes encode 11 protein variants. H2AC18, H2AC19, H2AC20, H2AC21 encode isoforms that have a methionine instead of leucine at position 51 conferring a mobility shift in triton-acid urea gel electrophoresis (historically, H2A.2 symbol was used to mark this difference) [franklin_non-allelic_1977]. H2AC1 gene (formerly, called HIST1H2AA, TH2A) is the most divergent gene of the family, together with H2BC1 they share a common promoter and manifest tissue-specific expression (at least in testis and oocytes) [huynh_two_2016].", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -665,25 +826,25 @@ "structure": "null", "interactions": "null", "disease": "null", - "caveats": "null" + "caveats": "1) A subset of clustered histones, which are normally expressed as replication-dependent histones, are expressed as polyadenylated mRNAs in adult non-dividing tissues to replenish histone pool in differentiated tissues [lyons_subset_2016]. 2) H2A.X histone variant is usually closely related to replication-dependent H2A histones in the same group of animals. In humans, H2A.X produces both polyadenylated mRNAs and mRNAs ending in a stem-loop. It is probable that it is ancestral to clustered H2A histones [talbert_histone_2021]. 3) The H2AJ gene on chromosome 12 encoding H2A.J histone variant is sequence-wise very similar to other canonical H2As in human. However, it appears to produce only polyadenylated mRNA. See H2A.J variant description for details."
}, - "taxonomic_span": "Fungi", - "taxonomic_span_id": "4751", + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", "alternate_names": [], "publications": [ - "nowrousian_5_2014", - "dalmasso_canonical_2011" + "franklin_non-allelic_1977", + "huynh_two_2016" ] }, - "cH2A_(Protists)": { - "level": "variant_group", + "cH2A_(Mammalia)": { + "level": "variant", "description": { - "summary": "cH2A_(Protists) -- canonical replication-dependent H2A histones in various protists.", - "taxonomy": "Protists", + "summary": "cH2A_(Mammalia) clustered H2A histones in mammals, often called canonical, replication-dependent, replication-coupled or \"bulk\" H2A histones. This is a subclass of cH2A_(Vertebrata) and cH2A_(Animals) (see it for a detailed description).", + "taxonomy": "Mammals (Mammalia)", "genes": "null", "evolution": "null", - "expression": "Recent evidence suggests that the specialized stem-loop forming 3-prime-end of replication-dependent histone mRNAs originated early in the evolution of eukaryotes but was completely lost in several lineages, including plants, fungi and most protozoa. Instead, these species synthesize histones from cell-cycle-regulated polyadenylated mRNAs, and regulation is primarily at the level of transcription [marzluff_metabolism_2008].", - "knock-out:": "null", + "expression": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -693,367 +854,1592 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "", - "taxonomic_span_id": "", + "taxonomic_span": "Mammalia", + "taxonomic_span_id": "40674", "alternate_names": [], "publications": [] }, - "H2A.Z": { - "level": "variant_group", + "cH2A_(Mus_musculus)": { + "level": "variant", "description": { - "summary": "H2A.Z -- is a replication-independent H2A histone variant strongly conserved in almost all Eukaryotes (exceptions may include some metamonads (e.g.
Giardia, Trichomonas), Amebae and parasitic fungi [dalmasso_canonical_2011]). This histone variant is essential from Tetrahymena to mammals (although its knock out in yeast is not lethal) and amounts to around 5-10% of H2A histones [dalmasso_canonical_2011]. H2A.Z containing nucleosomes often localize near transcription start sites (+1 nucleosomes) and enhancer regions, they are thought to be involved in Pol II recruitment, transcription regulation, DNA repair, suppression of antisense RNA, heterochromatin regulation. [giaimo_histone_2019]. H2A.Z nucleosomes have a larger acidic patch, an amino acid insertion in \u03b11-helix and one deletion in the docking domain compared to the canonical H2A. The L1-loop region exhibits four amino acids difference between H2A.Z and canonical H2A and is likely involved in conferring stability and functional specificity of variant nucleosomes via L1-L1 interactions [shaytan_nucleosome_2015]. C-terminal region of the yeast H2A.Z protein interacts with RNA polymerase II (RNAPII), promoting its recruitment at promoters [adam_h2az_2001]." + "summary": "cH2A_(Mus_musculus) clustered H2A histones in mouse, often called canonical, replication-dependent, replication-coupled or \"bulk\" H2A histones. repliation-dependent histones in mouse similar to human are found in several clusters. The largest cluster is found on chromosome 13 (more than 50 geens) and smaller clusters on chromosomes 3 and 11 [marzluff_human_2002]. 
There are 18 replication-dependent H2A genes currently annotated in mouse genome: 13 in cluster on chromosome 13, 4 in cluster on chromosome 3 and 1 on chromosome 11.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Eukaryotes", - "taxonomic_span_id": "2759", - "alternate_names": [ - { - "name": "Htz1p", - "taxonomy": "saccharomyces" - }, + "taxonomic_span": "Mus musculus", + "taxonomic_span_id": "10090", + "alternate_names": [], + "publications": [ + "marzluff_human_2002" + ] + }, + "cH2A_(Plants)": { + "level": "variant", + "description": { + "summary": "cH2A_(Plants) canonical H2A histones of green plants (Viridiplantae), which include green algae and land plants. This is a loosely defined group of replication-dependent H2A histones in plants together with similar sequences that might have further diversified towards replication-independent tissue-specific expression but have not yet been extensively studied. Currenly not much is known about the functional specialization of various cH2As isoforms in plants [alvarez-venegas_canonical_2019]. Organisation of canonical histones in green plants is variable. In land plants unlike clustered/canonical histones of animals (see cH2A_(Metazoa)) replication dependent histone mRNAs are polyadenilated and genes are interspersed throught the genome, H2A genes may have introns. 
In chlorophyte green algae, such as Chlamydomonas, genes are grouped in clusteres and mRNAs end in 3'-stem loop similar to those of histone genes in animals [marzluff_metabolism_2008, alvarez-venegas_canonical_2019]", + "taxonomy": "Viridiplantae (Plants)", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Viridiplantae", + "taxonomic_span_id": "33090", + "alternate_names": [], + "publications": [ + " alvarez-venegas_canonical_2019", + "alvarez-venegas_canonical_2019", + "marzluff_metabolism_2008" + ] + }, + "cH2A_(Protists)": { + "level": "variant", + "description": { + "summary": "cH2A_(Protists) canonical replication-dependent H2A histones in various protists.", + "taxonomy": "Protists", + "genes": "null", + "evolution": "null", + "expression": "Recent evidence suggests that the specialized stem-loop forming 3-prime-end of replication-dependent histone mRNAs originated early in the evolution of eukaryotes but was completely lost in several lineages, including plants, fungi and most protozoa. Instead, these species synthesize histones from cell-cycle-regulated polyadenylated mRNAs, and regulation is primarily at the level of transcription [marzluff_metabolism_2008].", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "null", + "taxonomic_span_id": "null", + "alternate_names": [], + "publications": [] + }, + "cH2A_(Vertebrata)": { + "level": "variant", + "description": { + "summary": "cH2A_(Vertebrata) clustered H2A histones in vertebrates, often called canonical, replication-dependent, replication-coupled or \"bulk\" H2A histones. 
This is a subclass of cH2A_(Animals) (see it for a detailed description).", + "taxonomy": "Vertebrates (Vertebrata)", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Vertebrata", + "taxonomic_span_id": "7742", + "alternate_names": [], + "publications": [] + }, + "cH2B": { + "level": "variant_group", + "description": { + "summary": "cH2B canonical H2B histones. Like cH2A, this is a loosely defined group that encompasses major H2B histone proteins that are expressed during S-phase of the cell cycle in eukaryotes and are highly conserved even between distantly related species. Such proteins are often called replication dependent (RD) or \"bulk\" histones [marzluff_metabolism_2008,talbert_histone_2021]. They are likely similar to the original H2B histones of the last common ancestor of eukaryotes [malik_phylogenomics_2003]. Expression of cH2Bs during S-phase is often tightly regulated, but mechanisms may differ among kingdoms [marzluff_birth_2017,pontarotti_long-term_2009]. These histones are often present as large multigene families. However, there are known limitations to the definition given above. Functional diversification of paralogous genes is a common process in evolution; in many species multiple copies of canonical histone genes have undergone diversification in terms of sequence variation, cell-cycle or tissue-specific expression patterns. Sometimes this diversification is very subtle and species-specific (e.g. cH2B.E isoforms in mouse), in other cases there may be a spectrum of canonical-like proteins (e.g. plant canonical H2Bs which show higher sequence diversity than cH2Bs of animals).
Hence, whether a particular gene should be regarded as a canonical, a bona fide variant or a canonical subvariant/isoform may be a matter of debate and definition in each particular case. Within the current hierarchical classification system, additional information about the cH2A class may be gained by looking at the description of its subclasses.", + "taxonomy": "Present in all Eukaryotes.", + "genes": "null", + "evolution": "It has been suggested that H2A and H2B have arisen from H3 and H4 during evolution [malik_phylogenomics_2003]. The eukaryotic H3-H4 tetramer resembles the tetramer found in Archaea, and it has been suggested that H2A and H2B have arisen from H3 and H4 later on in histone evolution [henneman_structure_2018].", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Eukaryota", + "taxonomic_span_id": "2759", + "alternate_names": [], + "publications": [ + "malik_phylogenomics_2003", + "marzluff_birth_2017", + "marzluff_metabolism_2008", + "pontarotti_long-term_2009", + "talbert_histone_2021" + ] + }, + "cH2B.10_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH2B.10_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC15 gene.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], + "publications": [] + }, + "cH2B.11_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH2B.11_(Homo_sapiens) is an isoform (variant) of 
clustered (canonical) H2B histones in human encoded by H2BC17 gene.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], + "publications": [] + }, + "cH2B.12_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH2B.12_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2B histones in human encoded by H2BC18 gene.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], + "publications": [] + }, + "cH2B.13_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH2B.13_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2B histones in human encoded by H2BC21 gene.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], + "publications": [] + }, + "cH2B.14_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH2B.14_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2B histones in human encoded by H2BC26 gene.", + "taxonomy": "null", + "genes": "null", + "evolution":
"null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], + "publications": [] + }, + "cH2B.15_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH2B.15_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC12L gene. H2BC12L is represented by a human-specific duplication of the H2BC12 gene from the chromosome 6 onto chromosome 21, the gene appears to be expressed, its protein sequence is expected to have two nonsynonymous substitutions with respect to H2BC12 gene.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], + "publications": [] + }, + "cH2B.1_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH2B.1_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC1 gene (formerly, HIST1H2BA, TH2B). This is the most divergent gene of the family (around 85% identity with other cH2Bs) [zalensky_human_2002]. Its length is also one amino acid longer than for the rest of H2Bs (126 amio acid residues after initiator methionine cleavage). Together with H2AC1 they share a common promoter and manifest tissue-specific expression (at least in testis and oocytes) (see human protein atlas). 
H2AC1 and H2BC1 are thought to be maternal effect factors and their expression was shown to enhance OSKM-induced cell reprogramming in human cells [huynh_two_2016]. See also description of cH2B.1_(Mus_musculus) a related histone variant encoded by H2bc1 gene which has been characterized through a number of in vivo and in vitro studies. Phylogenetic analysis of cH2B.1 in mammals by Raman et al. suggests that when considered together with its N-terminal tail histones form a distinct phylogenetic clade with high bootstrap support [raman_novel_2022].", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [ { - "name": "hv1", - "taxonomy": "tetrahymena" + "name": "TH2B" }, { - "name": "H2A.V", - "taxonomy": "drosophila" + "name": "TS H2B.1" }, { - "name": "H2Av", - "taxonomy": "drosophila" - }, + "name": "hTSH2B" + } + ], + "publications": [ + "huynh_two_2016", + "raman_novel_2022", + "zalensky_human_2002" + ] + }, + "cH2B.1_(Mus_musculus)": { + "level": "variant", + "description": { + "summary": "cH2B.1_(Mus_musculus) is an isoform (variant) of clustered (canonical) H2B histones in mouse encoded by H2bc1 gene (formerly, Hist1h2ba, Th2b). This is the most divergent gene of the family, its protein product has differences in INSERT HERE. Together with H2ac1 gene they share a common promoter and manifest tissue-specific expression (at least in testis, oocytes and zygotes) [padavattan_structural_2015]. Disruption of Th2a and Th2b genes causes defects in spermatogenesis [shinagawa_disruption_2015]. H2ac1 and H2bc1 contribute to activation of the paternal genome after fertilization [shinagawa_histone_2014]. 
These variant facilitate OSKM-induced cell reprogramming [shinagawa_histone_2014]. X-ray structure of nucleosome harboring this variant have fewer histone-DNA contacts and perturbed L1-L1-loop interactions. Mutational in vivo analysis suggest histone tails and L1 loop of cH2A.1 are important for reprogramming [padavattan_structural_2015]. Differential scanning calorimetry analysis indicated that the H2ac1/H2bc1 complex was more stable than other combinations of canonical histones [shinagawa_histone_2014]. This variant is related to cH2B.1_(Homo_sapiens) encoded by H2B1C gene, is located in the same position at the largest histone gene cluster, however, their sequence differs at INSERT HERE positions. Structural and in vitro studies suggest that cH2B.1-containing nucleosomes are less stable than RC H2B, which may allow H2B.1 to facilitate histone-protamine exchange during spermatogenesis. More recently, H2B.1 has also been detected in mouse oocytes, where its function is not yet understood [raman_novel_2022]. Note: Since this variant manifests similar features in mice and humans (tissue-specific expression, synteny, divergent sequence with respect to other canonical variants in each species) likely similar variants exist in all supraprimates or in higher taxa. Once and if sufficient evidence accumulates such variants may be grouped into a separate class.", + "taxonomy": "Mus musculus (House mouse)", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "Govin et al. 
investigated the stability of nucleosomes incorporating cH2B.1/H2A.L.2 histone dimer (H2A.L.2 encoded by H2al2a gene in mouse was used) and concluded that they were less stable than nucleosomes containing somatic histones [govin_pericentric_2007].", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Mus musculus", + "taxonomic_span_id": "10090", + "alternate_names": [ + { + "name": "Th2b" + }, + { + "name": "TS H2B.1" + } + ], + "publications": [ + "padavattan_structural_2015", + "raman_novel_2022", + "shinagawa_disruption_2015", + "shinagawa_histone_2014" + ] + }, + "cH2B.2_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH2B.2_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2B histones in human encoded by H2BC3 gene.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], + "publications": [] + }, + "cH2B.3_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH2B.3_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2B histones in human encoded by H2BC4, H2BC6, H2BC7, H2BC8, H2BC10 genes.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], + "publications": [] + }, + "cH2B.4_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH2B.4_(Homo_sapiens) is an isoform (variant) of 
clustered (canonical) H2B histones in human encoded by H2BC5 gene.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], + "publications": [] + }, + "cH2B.5_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH2B.5_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2B histones in human encoded by H2BC9 gene.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], + "publications": [] + }, + "cH2B.6_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH2B.6_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2B histones in human encoded by H2BC11 gene.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], + "publications": [] + }, + "cH2B.7_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH2B.7_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2B histones in human encoded by H2BC12 gene.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + 
"expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], + "publications": [] + }, + "cH2B.8_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH2B.8_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2B histones in human encoded by H2BC13 gene.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], + "publications": [] + }, + "cH2B.9_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH2B.9_(Homo_sapiens) is an isoform (variant) of clustered (canonical) H2B histones in human encoded by H2BC14 gene.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], + "publications": [] + }, + "cH2B.E_(Mus_musculus)": { + "level": "variant", + "description": { + "summary": "cH2B.E_(Mus_musculus) is an isoform (variant) of clustered (canonical) H2B histones in mouse encoded by H2bc21 gene (histone gene cluster on chromosome 3). It differs by four of five amino acids from other cH2Bs in mouse. 
It is expressed via a polyA-tail containing mRNA, typical of replication-independent variants in the main olfactory epithelium and the vomeronasal organ [santoro_activity-dependent_2012]. Santoro and Dulac showed that its expression is reduced by sensory activity and that it promotes neuronal cell death, such that inactive olfactory neurons display higher levels of the variant and shorter life spans. [santoro_activity-dependent_2012]", + "taxonomy": "Mus musculus (House mouse)", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Mus musculus", + "taxonomic_span_id": "10090", + "alternate_names": [ + { + "name": "H2B.21" + } + ], + "publications": [ + "santoro_activity-dependent_2012" + ] + }, + "cH2B_(Animals)": { + "level": "variant", + "description": { + "summary": "cH2B_(Animals) clustered H2B histones in animals (Metazoa), often called canonical, replication-dependent, replication-coupled or \"bulk\" H2B histones are a major class of H2B histones in animals with high sequence similarity across all animal species. Histone genes encoding these proteins have several particular features. 1) These genes lack introns and are found in multiple similar copies clustered along the genome together with other core histone genes (H3, H4, H2A, and optionally H1). The exact organisation may vary from tandemly repeated quintets of H3, H4, H2A, H2B, H1 genes transcribed from the same strand to non-tandem jumbled arrays of genes transcribed from divergent promoters [pontarotti_long-term_2009]. 
2) These genes are mainly expressed during S-phase of the cell cycle in a coordinated fashion (hence the name \"replication dependent\") and produce mRNAs that are not polyadenylated but rather end in a conserved stem-loop, which is further bound by the stem-loop binding protein (SLBP). mRNAs are rapidly degraded after the S-phase. 3) These genes are present in a specialized nuclear domain, the histone locus body (HLB), which concentrates factors for histone mRNA transcription and processing (in humans these include NPAT, U7 snRNP, FLASH) [marzluff_birth_2017].", + "taxonomy": "Animals (Metazoa)", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "1) Clustered histones may still exhibit some level of sequence variation between the multiple gene copies in certain species. Evidence exists that these differences may have functional implications (e.g. affect nucleosome stability). Some clustered genes have tissue-specific expression and play specific functional roles (e.g. cH2B.1 and cH2B.E in mice). 2) A subset of clustered histones, which are normally expressed as replication-dependent histones, are expressed as polyadenylated mRNAs in adult non-dividing tissues to replenish histone pool in differentiated tissues [lyons_subset_2016]. 3) Certain clustered histones may act as functional histone variants with replication-independent polyA-tail-regulated expression being the major/only form (e.g. cH2B.E_(Mus_musculus), or H2A.J, which is closely related to cH2As). 4) In C. elegans an alternative mechanism of mRNA 3'-end processing evolved resulting in loss of HLB and histone clusters [marzluff_birth_2017, pontarotti_long-term_2009]. 
" + }, + "taxonomic_span": "Metazoa", + "taxonomic_span_id": "33208", + "alternate_names": [], + "publications": [ + "marzluff_birth_2017", + "pontarotti_long-term_2009" + ] + }, + "cH2B_(Chlorophyta)": { + "level": "variant", + "description": { + "summary": "cH2B_(Chlorophyta) canonical H2B histones of green algae and similar replication-independent histones. In chlorophyte green algae, such as Chlamydomonas, genes are grouped in clusteres and mRNAs end in 3'-stem loop similar to those of histone genes in animals [marzluff_metabolism_2008, alvarez-venegas_canonical_2019]. See description of cH2B_(Plants) variant Jiang et al. paper for further information about H2B histones in plant [jiang_evolution_2020].", + "taxonomy": "Chlorophyta", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Chlorophyta", + "taxonomic_span_id": "3041", + "alternate_names": [], + "publications": [ + " alvarez-venegas_canonical_2019", + "jiang_evolution_2020", + "marzluff_metabolism_2008" + ] + }, + "cH2B_(Embryophyta)": { + "level": "variant", + "description": { + "summary": "cH2B_(Embryophyta) canonical H2B histones of land plants. In land plants unlike clustered/canonical histones of animals (see cH2A_(Metazoa)) replication dependent histone mRNAs are polyadenilated and genes are interspersed throught the genome [marzluff_metabolism_2008, alvarez-venegas_canonical_2019]. See description of cH2B_(Plants) variant Jiang et al. 
paper for further information about H2B histones in plant [jiang_evolution_2020].", + "taxonomy": "Embryophyta", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Embryophyta", + "taxonomic_span_id": "3193", + "alternate_names": [], + "publications": [ + " alvarez-venegas_canonical_2019", + "jiang_evolution_2020", + "marzluff_metabolism_2008" + ] + }, + "cH2B_(Fungi)": { + "level": "variant", + "description": { + "summary": "cH2B_(Fungi) canonical replication-dependent H2B histones in fungi. In most filamentous fungi, genes for the core histones H3, H2A, and H2B, as well as the linker histone H1, are unique [nowrousian_5_2014]. ", + "taxonomy": "Fungi", + "genes": "null", + "evolution": "null", + "expression": "Recent evidence suggests that the specialized stem-loop forming 3-prime-end of replication-dependent histone mRNAs originated early in the evolution of eukaryotes but was completely lost in several lineages, including plants, fungi and most protozoa. Instead, these species synthesize histones from cell-cycle-regulated polyadenylated mRNAs, and regulation is primarily at the level of transcription [marzluff_metabolism_2008].", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Fungi", + "taxonomic_span_id": "4751", + "alternate_names": [], + "publications": [ + "nowrousian_5_2014" + ] + }, + "cH2B_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH2B_(Homo_sapiens) clustered H2B histones in human, often called canonical, replication-dependent, replication-coupled or \"bulk\" H2B histones. 
For a general description see cH2B_(Animals) class. Replication-dependent histones in humans are found in four loci: a large cluster on chromosome 6 (more than 60 genes), two clusters on chromosome 1 (10-12 genes and 4 genes) and a single H4 gene on chromosome 12. Humans have 19 H2B genes that code for replication-dependent H2B histones. The cluster on chromosome 6 encodes 15 H2B genes (H2BC1, H2BC3-H2BC15, H2BC17) and several pseudogenes. The first cluster on chromosome 1 encodes 2 genes (H2BC18, H2BC21) and two pseudogenes (H2BC19P, H2BC20P), and the second cluster on chromosome 1 encodes one gene (H2BC26) and one pseudogene (H2BC27P). One additional gene H2BC12L is represented by a human-specific duplication of the H2BC12 gene from the chromosome 6 onto chromosome 21, the gene appears to be expressed, its protein sequence is expected to have two nonsynonymous substitutions with respect to H2BC12 gene. 19 cH2B genes in human encode 15 protein variants. H2BC1 gene (formerly called HIST1H2BA, TH2B) is the most divergent gene of the family, together with H2AC1 they share a common promoter and manifest tissue-specific expression (at least in testis and oocytes) [huynh_two_2016].", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "1) A subset of clustered histones, which are normally expressed as replication-dependent histones, are expressed as polyadenylated mRNAs in adult non-dividing tissues to replenish histone pool in differentiated tissues [lyons_subset_2016]. 
" + }, + "taxonomic_span": "null", + "taxonomic_span_id": "null", + "alternate_names": [], + "publications": [ + "huynh_two_2016" + ] + }, + "cH2B_(Mammalia)": { + "level": "variant", + "description": { + "summary": "cH2B_(Mammalia) clustered H2B histones in mammals, often called canonical, replication-dependent, replication-coupled or \"bulk\" H2B histones. This is a subclass of cH2B_(Vertebrata) and cH2B_(Animals) (see it for a detailed description).", + "taxonomy": "Mammals (Mammalia)", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Mammalia", + "taxonomic_span_id": "40674", + "alternate_names": [], + "publications": [] + }, + "cH2B_(Mus_musculus)": { + "level": "variant", + "description": { + "summary": "cH2B_(Mus_musculus) clustered H2B histones in mouse, often called canonical, replication-dependent, replication-coupled or \"bulk\" H2B histones. repliation-dependent histones in mouse similar to human are found in several clusters. The largest cluster is found on chromosome 13 (more than 50 genes) and smaller clusters on chromosomes 3 and 11 [marzluff_human_2002]. 
There are 18 replication-dependent H2B genes currently annotated in mouse genome: 15 in cluster on chromosome 13, 2 in cluster on chromosome 3 and 1 on chromosome 11.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Mus musculus", + "taxonomic_span_id": "10090", + "alternate_names": [], + "publications": [ + "marzluff_human_2002" + ] + }, + "cH2B_(Plants)": { + "level": "variant", + "description": { + "summary": "cH2B_(Plants) canonical H2B histones of green plants (Viridiplantae), which include green algae and land plants. Currently, this is a loosely defined group of replication-dependent H2B histones in plants together with similar sequences that might have further diversified towards replication-independent tissue-specific expression but have not yet been extensively studied. An example of the latter would be the HTB3 gene of Arabidopsis which has the hallmarks of a replacement histone variant enriched in mature cells [jiang_evolution_2020]. Organisation of canonical histones in green plants is variable. In land plants unlike clustered/canonical histones of animals (see cH2B_(Metazoa)) replication dependent histone mRNAs are polyadenilated and genes are interspersed throught the genome. In chlorophyte green algae, such as Chlamydomonas, genes are grouped in clusteres and mRNAs end in 3'-stem loop similar to those of histone genes in animals [marzluff_metabolism_2008, alvarez-venegas_canonical_2019]. Plant H2Bs vary substantially in the length and sequence of their N-terminal tails [jiang_evolution_2020,bergmuller_characterization_2007]. A study of evolution and functional divergence of H2B histones in plants by Jiang et al. 
concluded that amongst flowering plants, eudicots had experienced the highest degree of divergence among H2B genes [jiang_evolution_2020]. This divergence appears to have been driven by preferential expression during gametogenesis, including three genes in Arabidopsis (HTB7/8/10 genes) and at least one in tomato. While HTB8 gene in Arabidopsis belongs to a phylogenetically distinct H2B.S variant [jiang_evolution_2020], HTB7 and HTB10 are much more similar in sequence to other H2Bs for now are included as cH2B in our classification [alvarez-venegas_canonical_2019].", + "taxonomy": "Viridiplantae (Plants)", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Viridiplantae", + "taxonomic_span_id": "33090", + "alternate_names": [], + "publications": [ + " alvarez-venegas_canonical_2019", + "alvarez-venegas_canonical_2019", + "bergmuller_characterization_2007", + "jiang_evolution_2020", + "marzluff_metabolism_2008" + ] + }, + "cH2B_(Protists)": { + "level": "variant", + "description": { + "summary": "cH2B_(Protists) canonical replication-dependent H2B histones in various protists.", + "taxonomy": "Protists", + "genes": "null", + "evolution": "null", + "expression": "Recent evidence suggests that the specialized stem-loop forming 3-prime-end of replication-dependent histone mRNAs originated early in the evolution of eukaryotes but was completely lost in several lineages, including plants, fungi and most protozoa. 
Instead, these species synthesize histones from cell-cycle-regulated polyadenylated mRNAs, and regulation is primarily at the level of transcription [marzluff_metabolism_2008].", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "null", + "taxonomic_span_id": "null", + "alternate_names": [], + "publications": [] + }, + "cH2B_(Vertebrata)": { + "level": "variant", + "description": { + "summary": "cH2B_(Vertebrata) clustered H2B histones in vertebrates, often called canonical, replication-dependent, replication-coupled or \"bulk\" H2B histones. This is a subclass of cH2B_(Animals) (see it for a detailed description).", + "taxonomy": "Vertebrates (Vertebrata)", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Vertebrata", + "taxonomic_span_id": "7742", + "alternate_names": [], + "publications": [] + }, + "cH3": { + "level": "variant_group", + "description": { + "summary": "cH3 canonical H3 histones. This is a loosely defined group that encompasses major H3 histone proteins that are mainly expressed during S-phase of the cell cycle in eukaryotes and are highly conserved even between distantly related species. Such proteins are often called replication dependent (RD), replication coupled (RC), clustered or \"bulk\" histones [marzluff_metabolism_2008,talbert_histone_2021]. They are likely similar to the original H3 histones of the last common ancestor of eukaryotes [malik_phylogenomics_2003]. 
Expression of canonical histones during S-phase is often tightly regulated, but mechanisms may differ among kingdoms [marzluff_birth_2017,pontarotti_long-term_2009]. Canonical histone genes are often present as large multigene families clustered together in certain locations of the genome. However, there are known limitations to the definition given above. Functional diversification of paralogous genes is a common process in evolution; in some species multiple copies of canonical histone genes have undergone diversification in terms of sequence variation, cell-cycle or tissue-specific expression patterns. Such diversification for cH3s is rather limited compared to cH2As and cH2Bs. In humans there are only two very similar cH3 isoforms both expressed in S-phase (cH3.1 and cH3.2). However, the mammal-specific H3.4 variant, which manifests tissue-specific expression, is in fact very closely related to the canonical H3s (similarly to cH2A.1 and cH2B.1 it is located within histone gene clusters and has mRNA with a stem-loop). In plants, some cH3s show variable expression patterns [alvarez-venegas_canonical_2019]. Hence, whether a particular gene should be regarded as a canonical, a bona fide variant or a canonical subvariant/isoform may be a matter of debate and definition in each particular case. Another complication with defining cH3 class is that major H3 variants, such as H3.3, may only have 3-4 amino acid differences from the canonical H3 histone. They may have arisen multiple times during evolution and hence their functional classification does not match the phylogenetic classification. Ascomycetes are thought to have lost cH3 genes and generally have only a single form which is H3.3-like, it is usually referred to simply as H3 [talbert_unified_2012, malik_phylogenomics_2003]. Within the current hierarchical classification system, additional information about the cH3 class may be gained by looking at the description of its subclasses. 
", + "taxonomy": "Eukaryotes, although lost in ascomycetes.", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "" + }, + "taxonomic_span": "Eukaryota", + "taxonomic_span_id": "2759", + "alternate_names": [ { - "name": "H2AvD", - "taxonomy": "drosophila" + "name": "canonical H3" }, { - "name": "D2", - "taxonomy": "drosophila" + "name": "RC H3" }, { - "name": "member Z" + "name": "RD H3" } ], "publications": [ - "giaimo_histone_2019", - "colino-sanguino_h2az-nuclesome_2021", - "talbert_histone_2021", - "22650316", - "25731851", - "11101893", - "18275809", - "24311584", - "19193230", - "24969791", - "22467210", - "20003410", - "24768041", - "23301656", - "20197778", - "dalmasso_canonical_2011", - "shaytan_nucleosome_2015", - "adam_h2az_2001" + " malik_phylogenomics_2003", + "alvarez-venegas_canonical_2019", + "malik_phylogenomics_2003", + "marzluff_birth_2017", + "marzluff_metabolism_2008", + "pontarotti_long-term_2009", + "talbert_histone_2021", + "talbert_unified_2012" + ] + }, + "cH3.1_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH3.1_(Homo_sapiens) a mammal-specific cH3.1 paralog of canonical H3 histone in human encoded by the following 10 genes on chromosome 6: H3C1-H3C4, H3C6-H3C8, H3C10-H3C12. 
cH3.2 is the most common replicative histone in eukaryotes, cH3.1 differs from it by only one residue at position 96 [ray-gallet_histone_2021].", + "taxonomy": "Homo sapiens", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], + "publications": [ + "ray-gallet_histone_2021" + ] + }, + "cH3.1_(Mammalia)": { + "level": "variant", + "description": { + "summary": "cH3.1_(Mammalia) a mammal-specific subvariant of cH3 histone in mammals. Mammalian cH3s have the primary cH3.2 isoform and a mammal-specific cH3.1 paralog [talbert_histone_2021]. cH3.2 is the most common replicative histone in eukaryotes, cH3.1 differs from it by only one residue at position 96 [ray-gallet_histone_2021].", + "taxonomy": "Mammals (Mammalia)", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Mammalia", + "taxonomic_span_id": "40674", + "alternate_names": [], + "publications": [ + "ray-gallet_histone_2021", + "talbert_histone_2021" + ] + }, + "cH3.2_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "cH3.2_(Homo_sapiens) the cH3.2 isoform of cH3 histone in human, encoded by the following 3 genes on chromosome 1: H3C13, H3C14, H3C15. 
cH3.2 is the most common replicative histone in eukaryotes, cH3.1 differs from it by only one residue at position 96 [ray-gallet_histone_2021].", + "taxonomy": "Homo sapiens", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], + "publications": [ + "ray-gallet_histone_2021" ] }, - "H2A.Z.1_(Chordata)": { + "cH3.2_(Mammalia)": { "level": "variant", "description": { - "summary": "H2A.Z.1_(Chordata) -- product of one of two H2A.Z genes converved in chordates, homologous to human H2AZ1 gene [giaimo_histone_2019]. Porducts of H2AZ1 and H2AZ2 genes differ by only three amino acids, however they have acquired some degree of functional indepedence. For example, H2A.Z.1 has been shown to better interact with bromodomain-containing protein 2 (BRD2) [draker_combination_2012], H2A.Z.2 preferentially associates with H3 trimethylated at lysine 4 (H3K4me3) [dryhurst_characterization_2009]." 
+ "summary": "cH3.2_(Mammalia) is a subvariant of cH3 histone in mammals, which corresponds to the most common replicative histone in eukaryotes, cH3.1 differs from cH3.2 by only one residue at position 96 [ray-gallet_histone_2021].", + "taxonomy": "Mammals (Mammalia)", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Chordata", - "taxonomic_span_id": "7711", + "taxonomic_span": "Mammalia", + "taxonomic_span_id": "40674", "alternate_names": [], "publications": [ - "giaimo_histone_2019", - "colino-sanguino_h2az-nuclesome_2021", - "talbert_histone_2021", - "draker_combination_2012", - "dryhurst_characterization_2009" + "ray-gallet_histone_2021" ] }, - "H2A.Z.1_(Primates)": { + "cH3_(Animals)": { "level": "variant", "description": { - "summary": "H2A.Z.1_(Primates) -- H2A.Z.1 variant in primates, see H2A.Z.1_(Chordata) variant description." + "summary": "cH3_(Animals) clustered H3 histones in animals (Metazoa), often called canonical, replication-dependent, replication-coupled or \"bulk\" H3 histones are a major class of H3 histones in animals with high sequence similarity across all animal species. Histone genes encoding these proteins have several particular features. 1) These genes lack introns and are found in multiple similar copies clustered along the genome together with other core histone genes (H4, H2A, H2B, and optionally H1). The exact organisation may vary from tandemly repeated quintets of H3, H4, H2A, H2B, H1 genes transcribed from the same strand to non-tandem jumbled arrays of genes transcribed from divergent promoters [pontarotti_long-term_2009]. 
2) These genes are mainly expressed during S-phase of the cell cycle in a coordinated fashion (hence the name \"replication dependent\") and produce mRNAs that are not polyadenylated but rather end in a conserved stem-loop, which is further bound by the stem-loop binding protein (SLBP). mRNAs are rapidly degraded after the S-phase. 3) These genes are present in a specialized nuclear domain, the histone locus body (HLB), which concentrates factors for histone mRNA transcription and processing (in humans these include NPAT, U7 snRNP, FLASH) [marzluff_birth_2017].", + "taxonomy": "Animals (Metazoa)", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "1) Clustered histones may still exhibit some level of sequence variation between the multiple gene copies in certain species. Although for cH3 this variation is very limited (only two isoforms in humans: H3.1 and H3.2). 2) In C. elegans an alternative mechanism of mRNA 3'-end processing evolved resulting in loss of HLB and histone clusters [marzluff_birth_2017, pontarotti_long-term_2009]." }, - "taxonomic_span": "Primates", - "taxonomic_span_id": "9443", + "taxonomic_span": "Metazoa", + "taxonomic_span_id": "33208", "alternate_names": [], "publications": [ - "giaimo_histone_2019", - "colino-sanguino_h2az-nuclesome_2021", - "talbert_histone_2021" + "marzluff_birth_2017", + "pontarotti_long-term_2009" ] }, - "H2A.Z.1_(Homo_sapiens)": { + "cH3_(Chlorophyta)": { "level": "variant", "description": { - "summary": "H2A.Z.1_(Homo_sapiens) -- H2A.Z variant encoded in humans by H2A.Z.1 gene. Differes by only 3 amino acids from the product of H2A.Z.2 gene." + "summary": "cH3_(Chlorophyta) canonical replication-dependent H3 histones of green algae and similar replication-independent histones.
In chlorophyte green algae, such as Chlamydomonas, genes are grouped in clusters and mRNAs end in 3'-stem loop similar to those of histone genes in animals [marzluff_metabolism_2008, alvarez-venegas_canonical_2019].", + "taxonomy": "Chlorophyta", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Eukaryotes", - "taxonomic_span_id": "2759", + "taxonomic_span": "Chlorophyta", + "taxonomic_span_id": "3041", + "alternate_names": [], + "publications": [ + "alvarez-venegas_canonical_2019", + "marzluff_metabolism_2008" + ] + }, + "cH3_(Embryophyta)": { + "level": "variant", + "description": { + "summary": "cH3_(Embryophyta) canonical replication-dependent H3 histones of land plants and similar replication-independent histones. In land plants unlike clustered/canonical histones of animals (see cH3_(Animals)) replication dependent histone mRNAs are polyadenylated and genes are interspersed throughout the genome [marzluff_metabolism_2008, alvarez-venegas_canonical_2019].", + "taxonomy": "Embryophyta", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Embryophyta", + "taxonomic_span_id": "3193", + "alternate_names": [], + "publications": [ + "alvarez-venegas_canonical_2019", + "marzluff_metabolism_2008" + ] + }, + "cH3_(Fungi)": { + "level": "variant", + "description": { + "summary": "cH3_(Fungi) canonical replication-dependent H3 histones in fungi, excluding ascomycetes which have lost this gene class. In Ascomycetes such as Saccharomyces cerevisiae, only H3.3 gene is present.
Comparison with the basally branching Basidiomycetes, which have both H3 and H3.3, led Malik et al. to the conclusion that only the H3.3 version has been retained in Ascomycetes, presumably because H3.3 can deposit both during and after replication, whereas H3 cannot [malik_phylogenomics_2003].", + "taxonomy": "Fungi", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Fungi", + "taxonomic_span_id": "4751", + "alternate_names": [], + "publications": [ + "malik_phylogenomics_2003" + ] + }, + "cH3_(Mammalia)": { + "level": "variant", + "description": { + "summary": "cH3_(Mammalia) clustered H3 histones in mammals, often called canonical, replication-dependent, replication-coupled or \"bulk\" H3 histones. This is a subclass of cH3_(Vertebrata) and cH3_(Animals) (see the latter for a detailed description). Mammalian cH3s have the primary cH3.2 isoform and a mammal-specific cH3.1 paralog [talbert_histone_2021].", + "taxonomy": "Mammals (Mammalia)", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Mammalia", + "taxonomic_span_id": "40674", "alternate_names": [], "publications": [ - "giaimo_histone_2019", - "colino-sanguino_h2az-nuclesome_2021", "talbert_histone_2021" ] }, - "H2A.Z.2_(Chordata)": { + "cH3_(Plants)": { "level": "variant", "description": { - "summary": "H2A.Z.2_(Chordata) -- product of one of two H2A.Z genes converved in chordates, homologous to human H2A.Z.2 gene [giaimo_histone_2019].
Porducts of H2A.Z.1 and H2A.Z.2 genes differ by only three amino acids, however they have acquired some degree of functional indepedence. For example, H2A.Z.1 has been shown to better interact with bromodomain-containing protein 2 (BRD2) [draker_combination_2012], H2A.Z.2 preferentially associates with H3 trimethylated at lysine 4 (H3K4me3) [dryhurst_characterization_2009]." + "summary": "cH3_(Plants) canonical H3 histones of green plants (Viridiplantae), which include green algae and land plants. This is a loosely defined group of replication-dependent H3 histones in plants together with similar sequences that might have further diversified towards replication-independent tissue-specific expression but have not yet been extensively studied. Currently not much is known about the functional specialization of various cH3 isoforms in plants [alvarez-venegas_canonical_2019]. The canonical histone H3 or cH3.1 from higher plants is remarkably similar to that of animals, fungi, and even lower eukaryotes. A sequence comparison indicates that only four amino acid substitutions, F41Y, K53R, A90M, and A96C, differentiate the canonical histone H3 from plants and mammals. Interestingly, the five HTR genes from Arabidopsis encoding histone H3.1 do not contain introns and are expressed in tissues containing highly dividing cells and all but one are expressed during the S-phase of the cell cycle. In a similar way, the seven genes encoding H3.1 from rice also lack introns and several of them are expressed in highly dividing tissues [alvarez-venegas_canonical_2019]. Organisation of canonical histones in green plants is variable. In land plants unlike clustered/canonical histones of animals (see cH3_(Animals)) replication dependent histone mRNAs are polyadenylated and genes are interspersed throughout the genome.
In chlorophyte green algae, such as Chlamydomonas, genes are grouped in clusters and mRNAs end in 3'-stem loop similar to those of histone genes in animals [marzluff_metabolism_2008, alvarez-venegas_canonical_2019].", + "taxonomy": "Viridiplantae (Plants)", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Chordata", - "taxonomic_span_id": "7711", + "taxonomic_span": "Viridiplantae", + "taxonomic_span_id": "33090", "alternate_names": [], "publications": [ - "giaimo_histone_2019", - "colino-sanguino_h2az-nuclesome_2021", - "talbert_histone_2021", - "draker_combination_2012", - "dryhurst_characterization_2009" + " alvarez-venegas_canonical_2019", + "alvarez-venegas_canonical_2019", + "marzluff_metabolism_2008" ] }, - "H2A.Z.2_(Primates)": { + "cH3_(Protists)": { + "level": "variant", + "description": { + "summary": "cH3_(Protists) canonical replication-dependent H3 histones in various protists.", + "taxonomy": "Protists", + "genes": "null", + "evolution": "null", + "expression": "Recent evidence suggests that the specialized stem-loop forming 3-prime-end of replication-dependent histone mRNAs originated early in the evolution of eukaryotes but was completely lost in several lineages, including plants, fungi and most protozoa.
Instead, these species synthesize histones from cell-cycle-regulated polyadenylated mRNAs, and regulation is primarily at the level of transcription [marzluff_metabolism_2008].", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "SAR,Metamonada,Discoba,Amoebozoa", + "taxonomic_span_id": "2698737,2611341,2611352,554915", + "alternate_names": [], + "publications": [] + }, + "cH3_(Vertebrata)": { "level": "variant", "description": { - "summary": "H2A.Z.2_(Primates) -- H2A.Z.2 variant in primates, see H2A.Z.2_(Chordata) variant description." + "summary": "cH3_(Vertebrata) clustered H3 histones in vertebrates, often called canonical, replication-dependent, replication-coupled or \"bulk\" H3 histones. This is a subclass of cH3_(Animals) (see it for a detailed description).", + "taxonomy": "Vertebrates (Vertebrata)", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Vertebrata", + "taxonomic_span_id": "7742", + "alternate_names": [], + "publications": [] + }, + "cH4": { + "level": "variant_group", + "description": { + "summary": "Canonical histones are replication-dependent while histone variants are replication-independent, constitutively expressed during cell cycle. 
Genes encoding canonical histones are typically located within multigene clusters and use specific type of regulation at the RNA level with a stem loop structure instead of polyA tail", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Eukaryotes", + "taxonomic_span_id": "2759", + "alternate_names": [ + { + "name": "ca H4" + } + ], + "publications": [ + "22650316" + ] + }, + "CS_H2B_(Echinoidea)": { + "level": "variant_group", + "description": { + "summary": "CS_H2B_(Echinoidea) is a histone variant class containing cleavage-stage (CS) H2B histones characterized so far in sea urchins. Four classes of histones in sea urchins have been characterized. Three sets of histone variants are coexisting in the embryo at larval stages of sea urchin\u2019s development: the maternally inherited cleavage stage variants (CS) expressed during the two initial cleavage divisions, the early histone variants, which are recruited into embryonic chromatin from middle cleavage stages until hatching and the late variants, that are fundamentally expressed from blastula stage onward [oliver_conservative_2003]. The fourth class of histones in sea urchins are the sperm histones. They are exclusively transcribed during spermatogenesis and code for specialized H1 and H2B proteins with basic N-terminal extensions which are responsible for the unusually high chromatin condensation in mature sperm [mandl_five_1997]. Early, late, and sperm histone genes lack introns, contain the conserved 3-prime terminal stem-loop structure instead of a poly(A) addition site, and thus show the classical hallmarks of replication-dependent histone genes. 
The CS proteins are the first histones to be synthesized after fertilization in the cleaving embryo. The CS histones appear to be synthesized during oogenesis and in the mature egg, where they give rise to a large maternal pool of histone proteins. The CS proteins are the only histones present in the chromatin of the egg and zygote up to the second cell division. Thereafter, the efficient synthesis of the early histones leads to a rapid dilution of the CS histones in the chromatin except in the nondividing small micromeres, where the CS proteins remain the major histones up to the pluteus larva stage. The maternally stored CS histones play an important role in remodeling of the sperm chromatin after fertilization. Upon entry in the egg cytoplasm, the sperm H1 and H2B proteins present in the male pronucleus are rapidly phosphorylated on their N-terminal extensions, and the sperm H1 protein is subsequently replaced in the chromatin by the CS H1 protein. This exchange of H1 histones is immediately followed by decondensation of the chromatin. At around the time of DNA replication, the CS H2A and H2B proteins start to accumulate in the chromatin of the male pronucleus, which correlates with the transition of the nucleosomal repeat length from 250 bp in the sperm chromatin to 200 bp in the early embryo. As a consequence of this massive chromatin restructuring, the paternal genome is transcriptionally activated already at the beginning of S phase in the first cell cycle, which further emphasizes the importance of the CS histones for early development [mandl_five_1997].", + "taxonomy": "Echinoidea (sea urchins)", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "It is likely, that CS_H2B homologs are present in other taxonomic clades. Raman et al. 
suggested that newly identified histones H2B.N and H2B.K which are primarily expressed in ovaries and early embryos of mammals and may play key roles in female fertility and early development may be related to the cleavage stage histones of sea urchins [raman_novel_2022]. Other CS histones, such as CS H1 in sea urchins are functionally equivalent to frog H1M(B) proteins [mandl_five_1997]." }, - "taxonomic_span": "Primates", - "taxonomic_span_id": "9443", - "alternate_names": [], + "taxonomic_span": "Echinoidea", + "taxonomic_span_id": "7625", + "alternate_names": [ + { + "name": "cleavage H2B" + } + ], "publications": [ - "giaimo_histone_2019", - "colino-sanguino_h2az-nuclesome_2021", - "talbert_histone_2021" + "mandl_five_1997", + "oliver_conservative_2003" ] }, - "H2A.Z.2.s1_(Primates)": { - "level": "variant", + "early_H2B_(Echinoidea)": { + "level": "variant_group", "description": { - "summary": "H2A.Z.2.s1_(Primates) -- this is the main full length splice isoform of H2A.Z.2 in primates as compared to an slternatively spliced H2A.Z.2.s2 isofom which has an alternative shorter C-terminus [giaimo_histone_2019]." + "summary": "early_H2B_(Echinoidea) is a histone variant class of early H2B histones characterized so far in sea urchins. Four classes of histones in sea urchins have been characterized. Three sets of histone variants are coexisting in the embryo at larval stages of sea urchin\u2019s development: the maternally inherited cleavage stage variants (CS) expressed during the two initial cleavage divisions, the early histone variants, which are recruited into embryonic chromatin from middle cleavage stages until hatching and the late variants, that are fundamentally expressed from blastula stage onward [oliver_conservative_2003]. The fourth class of histones in sea urchins are the sperm histones [mandl_five_1997]. 
Early, late, and sperm histone genes lack introns, contain the conserved 3-prime terminal stem-loop structure instead of a poly(A) addition site, and thus show the classical hallmarks of replication-dependent histone genes. The repetitive early histone genes are transcriptionally activated upon meiotic maturation of the egg, are maximally expressed in the rapidly dividing blastula embryo, and are already silenced at the hatching blastula stage, when the transcripts of late histone genes start to accumulate [mandl_five_1997].", + "taxonomy": "Echinoidea (sea urchins)", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Primates", - "taxonomic_span_id": "9443", + "taxonomic_span": "Echinoidea", + "taxonomic_span_id": "7625", "alternate_names": [], "publications": [ - "giaimo_histone_2019" + "mandl_five_1997", + "oliver_conservative_2003" ] }, - "H2A.Z.2.s1_(Homo_sapiens)": { - "level": "variant", + "generic_H1": { + "level": "variant_group", "description": { - "summary": "H2A.Z.2.s1_(Homo_sapiens) -- this is the main full length splice isoform of H2A.Z.2 in humans as compared to an slternatively spliced H2A.Z.2.s2 isofom which has an alternative shorter C-terminus [giaimo_histone_2019]." + "summary": "H1 has mainly species specific variants. 
In the current version of HistoneDB all H1 are presented as generic_H1 class, except for several interesting species-specific variants which are provided as separate classes.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", - "alternate_names": [], + "taxonomic_span": "Eukaryotes", + "taxonomic_span_id": "2759", + "alternate_names": [ + { + "name": "gen H1" + } + ], "publications": [ - "giaimo_histone_2019" + "10973918", + "11149891", + "22650316", + "23945933", + "26212454" ] }, - "H2A.Z.2.s2_(Primates)": { - "level": "variant", + "gH2A": { + "level": "variant_group", "description": { - "summary": "H2A.Z.2.s2_(Primates) -- this is an alternatively spliced isoform of H2A.Z.2 in primates which has an alternative shorter C-terminus with respect to H2A.Z.2.s1 isoform. This isoform is expressed in a wide range of tissues, including brain tissues. Nucleosome containing H2A.Z.2.s2 isoform are less stable, than nuclesomes with the main isoform. [giaimo_histone_2019]." + "summary": "gH2A is a male-gamete-specific variant found in the genus Lilium [alvarez-venegas_canonical_2019,ueda_male_2005].", + "taxonomy": "Suggested to be a distinctive variant that evolved specifically in Lilium [alvarez-venegas_canonical_2019]", + "genes": "gH2A gene in Lilium longiflorum.
The gene is interrupted by one intron.", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "This histone variant is expected to be specifically synthesized in the male gametic cells and to cause chromatin condensation or remodeling of chromatin structure [ueda_male_2005].", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Primates", - "taxonomic_span_id": "9443", + "taxonomic_span": "Lilium", + "taxonomic_span_id": "4688", "alternate_names": [], "publications": [ - "giaimo_histone_2019" + "alvarez-venegas_canonical_2019", + "ueda_male_2005" ] }, - "H2A.Z.2.s2_(Homo_sapiens)": { - "level": "variant", + "gH2B": { + "level": "variant_group", "description": { - "summary": "H2A.Z.2.s2_(Homo_sapiens) -- this is an alternatively spliced isoform of H2A.Z.2 in humans which has an alternative shorter C-terminus with respect to H2A.Z.2.s1 isoform. This isoform is expressed in a wide range of tissues, including brain tissues. Nucleosome containing H2A.Z.2.s2 isoform are less stable, than nuclesomes with the main isoform. [giaimo_histone_2019]." + "summary": "gH2B is a group of plant H2B variants found in Lilium that are highly divergent from the canonical H2B and are expressed in the generative cell of the bicellular pollen where it may be necessary for chromatin remodeling of the male germline [alvarez-venegas_canonical_2019,yang_proteomic_2016,ueda_unusual_2000]. The subvariants so far identified are named gH2B in Lilium longiflorum, mgH2B in Lilium davidii, and mgH2B.in in Lilium davidii. These subvariants are rather different and are grouped due to lack of further information. 
Some phylogenetic reconstructions cluster these variants together with H2B.S [alvarez-venegas_canonical_2019], however, this is likely due to long-branch attraction, and the exact phylogeny remains to be studied [jiang_evolution_2020].", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "Lilium", + "taxonomic_span_id": "4688", "alternate_names": [], "publications": [ - "giaimo_histone_2019" + "alvarez-venegas_canonical_2019", + "jiang_evolution_2020", + "ueda_unusual_2000", + "yang_proteomic_2016" ] }, - "H2A.X": { - "level": "variant_group", + "H1": { + "level": "type", "description": { - "summary": "H2A.X -- is an H2A histone variant present in almost all Eukaryotes most notably involved in DNA damage response, marking the double strand DNA breaks with its phosphorylated form \u0263-H2A.X. It is also more broadly implicated in chromatin remodeling, found at collapsed replication forks and heterochromatin. It is a non-monophyletic (polyphyletic) variant of H2A and has the charactristic SQE/D\u03a6 motif at C-terminus (SQAY in Drosophila), where \u03a6-represents a hydrophobic residue (usually Tyr in mammals), and S is phosphorylation site. In multicellular eukaryotes H2A.X is usually closely related to cH2As in the same group of multicellular organisms [millar_organizing_2013, talbert_histone_2021]. It seems likely that H2A.X was ancestral to cH2As due to its conserved role in DNA damage response [talbert_histone_2010]. Caveats: Nematodes are the only known species that lack H2A.X. Many fungi lack canonical H2A its role is fullfiled by H2A.X. In Drosophila melanogaster H2A.X function is fullfiled by H2A.Z histone."
+ "summary": "H1 is the linker histone. Associates with the nucleosome core and linker DNA near the DNA entry-exit points. The resulting particle is called chromatosome. H1-histone is lysine rich, has long disordered C-terminal tail and a short N-terminal tail. The globular domain has three helices and a wing, so-called \"winged helix\" motif.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Eukaryotes", - "taxonomic_span_id": "2759", - "alternate_names": [ - { - "name": "member X" - } - ], - "publications": [ - "22650316", - "25731851", - "18095327", - "23301656", - "millar_organizing_2013", - " talbert_histone_2021", - "talbert_histone_2010" - ] + "taxonomic_span": "null", + "taxonomic_span_id": "null", + "alternate_names": [], + "publications": [] }, - "macroH2A": { + "H1.0": { "level": "variant_group", "description": { - "summary": "macroH2A is the largest replication independent H2A histone variant characterized by an additional non-histone ~30 kDa macro domain connected to the C-end of the histone fold via an unstructured linker. MacroH2A is conserved and widespread in vertebrates, but also found in invertebrates. MacroH2A is involved in heterochromatin formation, X-inactivation and transcriptional regulation. MacroH2A is broadly distributed across the genome, found at H3K27me3-decorated faculatative heterochromatin, constitutive heterochromatin regions, is incorporated at sites of DNA damage. Macro domains may be capable of binding NAD+ derived metabolites, such as ADP-ribose and poly-ADP-ribose. Mammals have two macroH2A genes (macroH2A.1 and macroH2A.2 in humans) [sun_histone_2019]." 
+ "summary": "H1.0 is a replication independent linker histone found in animals expressed in terminally differentiated cells. Has a common monophyletic origin that can be traced back before the differentiation between protostomes and deuterostomes, very early in metazoan evolution.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, "taxonomic_span": "Metazoa", "taxonomic_span_id": "33208", "alternate_names": [ { - "name": "mH2A" - }, - { - "name": "macroH2A1", - "gene": 1 - }, - { - "name": "macroH2A2", - "gene": 2 - }, - { - "name": "macroH2A1.1", - "gene": 1, - "splice": 1 + "name": "H1\u00b0" }, { - "name": "macroH2A1.2", - "gene": 1, - "splice": 2 + "name": "H5", + "taxonomy": "aves" }, { - "name": "macroH2A2.1", - "gene": 2, - "splice": 1 + "name": "H1\u03b4" }, { - "name": "macroH2A2.2", - "gene": 2, - "splice": 2 + "name": "RI H1" } ], "publications": [ "22650316", - "25731851", - "16107708", - "20543561", - "16803903", - "sun_histone_2019" - ] - }, - "macroH2A.1_(Mammalia)": { - "level": "variant", - "description": { - "summary": "macroH2A.1_(Mammalia) is a protein encoded by one of the macroH2A genes in mammals (coresponds to macroH2A.1 gene in humans). This gene further produces two splice variants macroH2A.1.s1 and macroH2A.1.s2 by inclusion of mutually exclusive exons encoding a region within the macro domain. The macro domain of macroH2A.1.s1 isoform is capable of binding NAD+ derived metabolites, such as ADP-ribose and poly-ADP-ribose, while other isoforms (including those produced by macroH2A.2 gene homologs) do not have this ability [sun_histone_2019]." 
- }, - "taxonomic_span": "Mammalia", - "taxonomic_span_id": "40674", - "alternate_names": [], - "publications": [ - "sun_histone_2019" + "23945933", + "2898141", + "7066298" ] }, - "macroH2A.1.s1_(Mammalia)": { - "level": "variant", + "H1.1": { + "level": "variant_group", "description": { - "summary": "macroH2A.1.s1_(Mammalia) is a splice isoform encoded by one of the macroH2A genes in mammals (coresponds to macroH2A.1 gene in humans). The macro domain of macroH2A.1.s1 isoform is capable of binding NAD+ derived metabolites, such as ADP-ribose and poly-ADP-ribose, while other isoforms (including those produced by macroH2A.2 gene homologs) do not have this ability [sun_histone_2019]." + "summary": "H1.1 is a replication independent linker histone.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Mammalia", - "taxonomic_span_id": "40674", + "taxonomic_span": "Homo", + "taxonomic_span_id": "9605", "alternate_names": [], "publications": [ - "sun_histone_2019" + "26689747" ] }, - "macroH2A.1.s1_(Homo_sapiens)": { - "level": "variant", + "H1.10": { + "level": "variant_group", "description": { - "summary": "macroH2A.1.s1_(Homo_sapiens) is a splice isoform encoded by macroH2A.1 gene in humans. The macro domain of macroH2A.1.s1 isoform is capable of binding NAD+ derived metabolites, such as ADP-ribose and poly-ADP-ribose, while other isoforms (including those produced by macroH2A.2 gene homologs) do not have this ability [sun_histone_2019]." 
+ "summary": "Sequences collected here belong to H1.10 here - a vertebrate specific H1 variant.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", - "alternate_names": [], + "taxonomic_span": "Vertebrates", + "taxonomic_span_id": "7742", + "alternate_names": [ + { + "name": "H1x" + } + ], "publications": [ - "sun_histone_2019" + "22650316" ] }, - "macroH2A.1.s2_(Mammalia)": { - "level": "variant", + "H1.2": { + "level": "variant_group", "description": { - "summary": "macroH2A.1.s2_(Mammalia) is a splice isoform encoded by one of the macroH2A genes in mammals (coresponds to macroH2A.1 gene in humans). The macro domain of macroH2A.1.s2 isoform is not capable of binding NAD+ derived metabolites, such as ADP-ribose and poly-ADP-ribose [sun_histone_2019]." + "summary": "H1.2 is a replication independent linker histone.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Mammalia", - "taxonomic_span_id": "40674", + "taxonomic_span": "Homo", + "taxonomic_span_id": "9605", "alternate_names": [], "publications": [ - "sun_histone_2019" + "26689747" ] }, - "macroH2A.1.s2_(Homo_sapiens)": { - "level": "variant", + "H1.3": { + "level": "variant_group", "description": { - "summary": "macroH2A.1.s2_(Homo_sapiens) is a splice isoform encoded by macroH2A.1 gene in humans. 
The macro domain of macroH2A.1.s2 isoform is not capable of binding NAD+ derived metabolites, such as ADP-ribose and poly-ADP-ribose [sun_histone_2019]." + "summary": "H1.3 is a replication independent linker histone.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "Homo", + "taxonomic_span_id": "9605", "alternate_names": [], "publications": [ - "sun_histone_2019" + "26689747" ] }, - "macroH2A.2_(Mammalia)": { - "level": "variant", + "H1.4": { + "level": "variant_group", "description": { - "summary": "macroH2A.2_(Mammalia) is a protein encoded by one of the macroH2A genes in mammals (coresponds to macroH2A.2 gene in humans). The macro domain of macroH2A.2 variant is not capable of binding NAD+ derived metabolites [sun_histone_2019]." + "summary": "H1.4 is a replication independent linker histone.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Mammalia", - "taxonomic_span_id": "40674", + "taxonomic_span": "Homo", + "taxonomic_span_id": "9605", "alternate_names": [], "publications": [ - "sun_histone_2019" + "26689747" ] }, - "macroH2A.2_(Homo_sapiens)": { - "level": "variant", + "H1.5": { + "level": "variant_group", "description": { - "summary": "macroH2A.2_(Homo_sapiens) is a protein encoded by macroH2A.2 gene in humans. The macro domain of macroH2A.2 variant is not capable of binding NAD+ derived metabolites [sun_histone_2019]." 
+ "summary": "H1.5 is a replication independent linker histone.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "Homo", + "taxonomic_span_id": "9605", "alternate_names": [], "publications": [ - "sun_histone_2019" + "26689747" ] }, - "short_H2A": { - "level": "variant_group", + "H2A": { + "level": "type", "description": { - "summary": "short_H2A is a class encompassing several histone H2A variants in placental (eutherian) mammals with shortened C-terminus expressed mainly during mammalian male germ cell development before the nearly complete replacement of histones by protamines in sperm nuclei. The repertoires of short histone H2A variants vary extensively among eutherian mammals due to lineage-specific gains and losses. Short H2A variants include H2A.B, H2A.L, H2A.P, H2A.Q, their genes are usually located on X chromosome and are intronless. These four clades of eutherian mammal short H2A variants emerged from a single, well-supported monophyletic clade, confirming their common ancestry [molaro_evolutionary_2018]. Due to shortened docking domain and changes within the acidic patch nucleosomes incorporating short H2As wrap less DNA (120-130 bp) and form loosely packed chromatin. There are few conserved residues in the histone fold domain of sH2As that distinguish them from each other, instead much of their specialization may stem from changes in the N- and C-terminal tails of these variatns [molaro_evolutionary_2018]. Abberant short H2A upregulation was reported in a broad range of cancers [chew_short_2021]. Caveats: H2A.B is also expressed in the brain [jiang_short_2020]." 
+ "summary": "H2A is one of the core histone types present in all Eukaryotes. H2A forms dimers with H2B via the \"hand shake\" motif. Two H2A-H2B dimers in turn associate with H3-H4 tetramer to form complete nucleosome core. Structure of H2A consists of a histone fold domain extended by a short \u03b1C-helix and has both N- and C-terminal tails. \u03b1C-helix and C-terminal tail form \"docking domain\" that locks the H2A-H2B dimer onto the surface of H3-H4 tetramer [luger_crystal_1997]. It has been suggested that H2A and H2B have arisen from H3 and H4 during evolution [malik_phylogenomics_2003]. H2A histones have the most number of described functional variants.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Eutheria", - "taxonomic_span_id": "9347", - "alternate_names": [ - { - "name": "sH2A" - } - ], + "taxonomic_span": "Eukaryotes", + "taxonomic_span_id": "2759", + "alternate_names": [], "publications": [ - "molaro_evolutionary_2018", - "chew_short_2021", - "jiang_short_2020" + "luger_crystal_1997", + "malik_phylogenomics_2003" ] }, "H2A.B": { "level": "variant", "description": { - "summary": "H2A.B, previously known as \"Barr body deficient\" (H2A.Bbd) variant -- is a short replication independent H2A variant found in eutherian mammals implicated in spermiogenesis, transcription regulation, splicing, DNA synthesis. Genes: Common ancestor of eutherian mammals encoded two or three H2A.B genes. Genes are usually located on X chromosome in three conserved locations (except in mouse, where H2A.B genes are located at other locations on X chromosome with unclear kinship to the ancestral genes that relocated to autosomes and decayed [molaro_evolutionary_2018]). 
Human and mouse have three genes encoding H2A.Bs [molaro_evolutionary_2018]. Evolution: H2A.B is a rapildy evolving variant which is closely related to H2A.L, H2A.P, H2A.Q. It was suggested that H2A.B have been the subject to diversifying selection in simian primates, although mucj of the increased divergence of short histone H2A variants may be better explained by relaxed purifying selection [molaro_evolutionary_2018]. Knock-out: H2A.B knock-out mice are viable, subfertile and display changes in splicing events [anuar_gene_2019]. Sequence: Around 50% identity with the canonical H2A, has truncated docking domain, divergent histone fold domain, altered acidic patch, arginine rich N-terminus [molaro_evolutionary_2018]. Localization: H2A.B is expressed during mammalian male germ cell development and in the brain [molaro_evolutionary_2018,jiang_short_2020]. Originally, H2A.B was characterized by its exclusion from the inactive X chromosome if overexpressed in female somatic cells [chadwick_novel_2001]. However, experiments in mouse testis revealed that H2A.B is in fact present on the inactive X chromosome [soboleva_unique_2011]. Short H2A variants localize to sites of open chromatin and potentiate DNA synthesis, transcription, and splicing [molaro_evolutionary_2018]. This histone variant can bind to RNA directly in vitro and in vivo, and associates with mRNA at intron\u2014exon boundaries [soboleva_new_2017]. Structural effects: H2A.B containing nucleosomes wrap less DNA (~120-130 bp instead of ~150 bp) [sugiyama_distinct_2014,doyen_dissection_2006], form loosely packed chromatin. Interactions: RNA processing factors, proteins involved in the piRNA pathway [jiang_short_2020] Deposition: It was suggested that H2A.B is incorporated into DNA sites that are transiently exposed, for instance, during DNA replication [jiang_short_2020]. H2A.B-H2A dimers in nucleosomes can spontaneously be replaced by H2A-H2B dimers [hirano_histone_2021]. 
Disease: H2A.B is upregulated in cancer as other short H2A variants [chew_short_2021]. Caveats: Due to rapid evolution H2A.B function in different species may vary. For example, human H2A.B is retained during spermiogenesis, while is mouse it disappears and H2A.L is retained instead [molaro_evolutionary_2018]. Mouse H2A.B has additional negative residue in acidic patch, which is thought to increase its propensity to compact nucleosomal arrays relative to human H2A.B." + "summary": "H2A.B, previously known as \"Barr body deficient\" (H2A.Bbd) variant is a short replication independent H2A variant found in eutherian mammals implicated in spermiogenesis, transcription regulation, splicing, DNA synthesis. Genes: Common ancestor of eutherian mammals encoded two or three H2A.B genes. Genes are usually located on X chromosome in three conserved locations (except in mouse, where H2A.B genes are located at other locations on X chromosome with unclear kinship to the ancestral genes that relocated to autosomes and decayed [molaro_evolutionary_2018]). Human and mouse have three genes encoding H2A.Bs [molaro_evolutionary_2018]. Evolution: H2A.B is a rapidly evolving variant which is closely related to H2A.L, H2A.P, H2A.Q. It was suggested that H2A.B has been subject to diversifying selection in simian primates, although much of the increased divergence of short histone H2A variants may be better explained by relaxed purifying selection [molaro_evolutionary_2018]. Knock-out: H2A.B knock-out mice are viable, subfertile and display changes in splicing events [anuar_gene_2019]. Sequence: Around 50% identity with the canonical H2A, has truncated docking domain, divergent histone fold domain, altered acidic patch, arginine rich N-terminus [molaro_evolutionary_2018]. Localization: H2A.B is expressed during mammalian male germ cell development and in the brain [molaro_evolutionary_2018,jiang_short_2020]. 
Originally, H2A.B was characterized by its exclusion from the inactive X chromosome if overexpressed in female somatic cells [chadwick_novel_2001]. However, experiments in mouse testis revealed that H2A.B is in fact present on the inactive X chromosome [soboleva_unique_2011]. Short H2A variants localize to sites of open chromatin and potentiate DNA synthesis, transcription, and splicing [molaro_evolutionary_2018]. This histone variant can bind to RNA directly in vitro and in vivo, and associates with mRNA at intron\u2014exon boundaries [soboleva_new_2017]. Structural effects: H2A.B containing nucleosomes wrap less DNA (~120-130 bp instead of ~150 bp) [sugiyama_distinct_2014,doyen_dissection_2006], form loosely packed chromatin. Interactions: RNA processing factors, proteins involved in the piRNA pathway [jiang_short_2020]. Deposition: It was suggested that H2A.B is incorporated into DNA sites that are transiently exposed, for instance, during DNA replication [jiang_short_2020]. H2A.B-H2A dimers in nucleosomes can spontaneously be replaced by H2A-H2B dimers [hirano_histone_2021]. Disease: H2A.B is upregulated in cancer as other short H2A variants [chew_short_2021]. Caveats: Due to rapid evolution H2A.B function in different species may vary. For example, human H2A.B is retained during spermiogenesis, while in mouse it disappears and H2A.L is retained instead [molaro_evolutionary_2018]. 
Mouse H2A.B has additional negative residue in acidic patch, which is thought to increase its propensity to compact nucleosomal arrays relative to human H2A.B.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, "taxonomic_span": "Eutheria", "taxonomic_span_id": "9347", @@ -1069,148 +2455,304 @@ } ], "publications": [ - "molaro_evolutionary_2018", "anuar_gene_2019", - "jiang_short_2020", "chadwick_novel_2001", - "soboleva_unique_2011", - "soboleva_new_2017", - "sugiyama_distinct_2014", + "chew_short_2021", "doyen_dissection_2006", "hirano_histone_2021", - "chew_short_2021" + "jiang_short_2020", + "molaro_evolutionary_2018", + "soboleva_new_2017", + "soboleva_unique_2011", + "sugiyama_distinct_2014" ] }, - "H2A.B_(Homo_sapiens)": { + "H2A.B.1_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "H2A.B_(Homo_sapiens), previously known as \"Barr body deficient\" (H2A.Bbd) variant -- is a group of short replication independent H2A variants in humans encoded by H2AB1, H2AB2 and H2AB3 genes. They are involved in spermiogenesis, transcription regulation, splicing, DNA synthesis. Genes: In human H2A.B is encoded by H2AB1, H2AB2 and H2AB3 genes. Genes are intronless. H2AB2 and H2AB3 encode identical proteins. H2AB1 protein which differes by ??one?? amino acid. Genes are located on X chromosome. Evolution: H2A.B is a rapildy evolving variant which is closely related to H2A.L, H2A.P, H2A.Q [molaro_evolutionary_2018]. Common ancestor of eutherian mammals encoded two or three H2A.B genes. Knock-out: H2A.B knock-out mice are viable, subfertile and display changes in splicing events [anuar_gene_2019]. 
Sequence: Around 50% identity with the canonical H2A, has truncated docking domain, divergent histone fold domain, altered acidic patch, arginine rich N-terminus [molaro_evolutionary_2018]. Localization: H2A.B is expressed during mammalian male germ cell development and in the brain [molaro_evolutionary_2018,jiang_short_2020]. Originally, H2A.B was characterized by its exclusion from the inactive X chromosome if overexpressed in female somatic cells [chadwick_novel_2001]. However, experiments in mouse testis revealed that H2A.B is in fact present on the inactive X chromosome [soboleva_unique_2011]. Short H2A variants localize to sites of open chromatin and potentiate DNA synthesis, transcription, and splicing [molaro_evolutionary_2018]. In mouse this histone variant was shown to bind to RNA directly in vitro and in vivo, and associate with mRNA at intron\u2014exon boundaries [soboleva_new_2017]. Structural effects: H2A.B containing nucleosomes wrap less DNA (~120-130 bp instead of ~150 bp) [sugiyama_distinct_2014,doyen_dissection_2006], form loosely packed chromatin. Interactions: RNA processing factors, proteins involved in the piRNA pathway [jiang_short_2020] Deposition: It was suggested that H2A.B is incorporated into DNA sites that are transiently exposed, for instance, during DNA replication [jiang_short_2020]. H2A.B-H2A dimers in nucleosomes can spontaneously be replaced by H2A-H2B dimers [hirano_histone_2021]. Disease: H2A.B is upregulated in cancer as other short H2A variants [chew_short_2021]. Caveats: Due to rapid evolution H2A.B function in different species may vary. For example, human H2A.B is retained during spermiogenesis, while is mouse it disappears and H2A.L is retained instead [molaro_evolutionary_2018]. Mouse H2A.B has additional negative residue in acidic patch, which is thought to increase its propensity to compact nucleosomal arrays relative to human H2A.B." 
+ "summary": "H2A.B.1_(Homo_sapiens) is one of the two isoforms of H2A.B variant in humans encoded by H2AB1 gene. This isoform differs by ??one?? amino acid from H2A.B.2 isoform encoded by H2AB2 and H2AB3 genes. Caveats: Unfortunately there is confusion with respect to the number suffix in the literature. El Kennani et al. have used this numbering scheme that follows the numbers in the gene names [el_kennani_ms_histonedb_2017]. And the gene names are numbered from centromere to telomere. However, Molaro et al. in their evolutionary analysis have used H2A.B.1.1, H2A.B.1.2 and H2A.B.2 to refer to H2AB3, H2AB2 and H2AB1 genes, respectively. The variant numbering used by Molaro et al. was based on the relative position of the genes on each arm of the X Chromosome from telomere to centromere [molaro_evolutionary_2018].", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, "taxonomic_span": "Homo sapiens", "taxonomic_span_id": "9606", "alternate_names": [ { - "name": "H2A.Bbd" + "name": "H2A.B.2" } ], "publications": [ - "molaro_evolutionary_2018", + "el_kennani_ms_histonedb_2017", + "molaro_evolutionary_2018" + ] + }, + "H2A.B.1_(Mus_musculus)": { + "level": "variant", + "description": { + "summary": "H2A.B.1_(Mus_musculus) is one of the three isoforms of H2A.B variant in mouse encoded by H2ab3 gene. Caveats: Unfortunately there is some confusion with respect to the number suffixes in the literature and between the gene names and variant names. 
Since a variant encoded by H2ab1 gene was named initially H2A.Lap1 [soboleva_unique_2011], but renamed afterwards to H2A.B.3 [soboleva_new_2017], and this name has been used afterwards [anuar_gene_2019,jiang_short_2020], the H2ab3 gene variant is named here as H2A.B.1.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Mus musculus", + "taxonomic_span_id": "10090", + "alternate_names": [], + "publications": [ "anuar_gene_2019", "jiang_short_2020", - "chadwick_novel_2001", - "soboleva_unique_2011", "soboleva_new_2017", - "sugiyama_distinct_2014", - "doyen_dissection_2006", - "hirano_histone_2021", - "chew_short_2021" + "soboleva_unique_2011" ] }, - "H2A.B.1_(Homo_sapiens)": { + "H2A.B.2_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "H2A.B.2_(Homo_sapiens) is one of the two isoforms of H2A.B variant in humans encoded by H2AB2 and H2AB3 genes. This isoform differs by ??one?? amino acid from H2A.B.1 isoform encoded by H2AB1 gene. Caveats: Unfortunately there is confusion with respect to the number suffix in the literature. El Kennani et al. have used this numbering scheme that follows the numbers in the gene names [el_kennani_ms_histonedb_2017]. And the gene names are numbered from centromere to telomere. However, Molaro et al. in their evolutionary analysis have used H2A.B.1.1, H2A.B.1.2 and H2A.B.2 to refer to H2AB3, H2AB2 and H2AB1 genes, respectively. The variant numbering used by Molaro et al. 
was based on the relative position of the genes on each arm of the X Chromosome from telomere to centromere [molaro_evolutionary_2018].", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [ + { + "name": "H2A.B.1" + }, + { + "name": "H2A.B.1.1" + }, + { + "name": "H2A.B.1.2" + } + ], + "publications": [ + "el_kennani_ms_histonedb_2017", + "molaro_evolutionary_2018" + ] + }, + "H2A.B.2_(Mus_musculus)": { + "level": "variant", + "description": { + "summary": "H2A.B.2_(Mus_musculus) is one of the three isoforms of H2A.B variant in mouse encoded by H2ab2 gene.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Mus musculus", + "taxonomic_span_id": "10090", + "alternate_names": [], + "publications": [] + }, + "H2A.B.3_(Mus_musculus)": { "level": "variant", "description": { - "summary": "H2A.B.1_(Homo_sapiens) is one of the two isoform of H2A.B variant in humans encoded by H2AB1 gene. This isoform differs by ??one?? amino acid from H2A.B.2 isoform encoded by H2AB2 and H2AB3 genes. Caveats: Unfortunately there is confusion with respect to the number suffix in the literature. El Kennani et al. have used this numbering scheme that follows the numbers in the gene names [el_kennani_ms_histonedb_2017]. And the gene names are numbered from centromere to telomere. However, Molaro et al. 
in their evolutionary analysis have used H2A.B.1.1, H2A.B.1.2 and H2A.B.2 to reffer to H2AB3, H2AB2 and H2AB1 genes, respectively. The variant numbering used by Molaro et al. was based on the relative position of the genes on each arm of the X Chromosome from telomere to centromere [molaro_evolutionary_2018]." + "summary": "H2A.B.3_(Mus_musculus) is one of the three isoforms of H2A.B variant in mouse encoded by H2ab1 gene. This gene has been characterized the most experimentally among all H2A.B variants. Caveats: Unfortunately there is some confusion with respect to the number suffixes in the literature and between the gene names and variant names. This variant was named initially H2A.Lap1 [soboleva_unique_2011], but renamed afterwards to H2A.B.3 [soboleva_new_2017], and this name has been used afterwards [anuar_gene_2019,jiang_short_2020]. Hence we follow the established convention. Caveat: Molaro et al. suggest that \"rat-mouse common ancestor acquired an intact H2A.B gene in a new X-linked locus (H2a.b.ratMouse1, also historically named H2A.B.3) [molaro_evolutionary_2018]\". Our analysis of supplementary information suggests that H2a.b.ratMouse1 is H2ab2 gene in the current nomenclature. Our analysis of sequences published by Soboleva et al. 
suggests that H2A.B.3 (H2A.Lap1) is H2ab1 gene and not H2ab2 [soboleva_unique_2011].", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "Mus musculus", + "taxonomic_span_id": "10090", "alternate_names": [ { - "name": "H2A.B.2" + "name": "H2A.Lap1" } ], "publications": [ - "el_kennani_ms_histonedb_2017", - "molaro_evolutionary_2018" + "anuar_gene_2019", + "jiang_short_2020", + "molaro_evolutionary_2018", + "soboleva_new_2017", + "soboleva_unique_2011" ] }, - "H2A.B.2_(Homo_sapiens)": { + "H2A.B_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "H2A.B.2_(Homo_sapiens) is one of the two isoform of H2A.B variant in humans encoded by H2AB2 and H2AB3 genes. This isoform differs by ??one?? amino acid from H2A.B.1 isoform encoded by H2AB1 gene. Caveats: Unfortunately there is confusion with respect to the number suffix in the literature. El Kennani et al. have used this numbering scheme that follows the numbers in the gene names [el_kennani_ms_histonedb_2017]. And the gene names are numbered from centromere to telomere. However, Molaro et al. in their evolutionary analysis have used H2A.B.1.1, H2A.B.1.2 and H2A.B.2 to reffer to H2AB3, H2AB2 and H2AB1 genes, respectively. The variant numbering used by Molaro et al. was based on the relative position of the genes on each arm of the X Chromosome from telomere to centromere [molaro_evolutionary_2018]." + "summary": "H2A.B_(Homo_sapiens), previously known as \"Barr body deficient\" (H2A.Bbd) variant is a group of short replication independent H2A variants in humans encoded by H2AB1, H2AB2 and H2AB3 genes. 
They are involved in spermiogenesis, transcription regulation, splicing, DNA synthesis. Genes: In human H2A.B is encoded by H2AB1, H2AB2 and H2AB3 genes. Genes are intronless. H2AB2 and H2AB3 encode identical proteins. The H2AB1 protein differs from them by ??one?? amino acid. Genes are located on X chromosome. Evolution: H2A.B is a rapidly evolving variant which is closely related to H2A.L, H2A.P, H2A.Q [molaro_evolutionary_2018]. Common ancestor of eutherian mammals encoded two or three H2A.B genes. Knock-out: H2A.B knock-out mice are viable, subfertile and display changes in splicing events [anuar_gene_2019]. Sequence: Around 50% identity with the canonical H2A, has truncated docking domain, divergent histone fold domain, altered acidic patch, arginine rich N-terminus [molaro_evolutionary_2018]. Localization: H2A.B is expressed during mammalian male germ cell development and in the brain [molaro_evolutionary_2018,jiang_short_2020]. Originally, H2A.B was characterized by its exclusion from the inactive X chromosome if overexpressed in female somatic cells [chadwick_novel_2001]. However, experiments in mouse testis revealed that H2A.B is in fact present on the inactive X chromosome [soboleva_unique_2011]. Short H2A variants localize to sites of open chromatin and potentiate DNA synthesis, transcription, and splicing [molaro_evolutionary_2018]. In mouse this histone variant was shown to bind to RNA directly in vitro and in vivo, and associate with mRNA at intron\u2014exon boundaries [soboleva_new_2017]. Structural effects: H2A.B containing nucleosomes wrap less DNA (~120-130 bp instead of ~150 bp) [sugiyama_distinct_2014,doyen_dissection_2006], form loosely packed chromatin. Interactions: RNA processing factors, proteins involved in the piRNA pathway [jiang_short_2020]. Deposition: It was suggested that H2A.B is incorporated into DNA sites that are transiently exposed, for instance, during DNA replication [jiang_short_2020]. 
H2A.B-H2A dimers in nucleosomes can spontaneously be replaced by H2A-H2B dimers [hirano_histone_2021]. Disease: H2A.B is upregulated in cancer as other short H2A variants [chew_short_2021]. Caveats: Due to rapid evolution H2A.B function in different species may vary. For example, human H2A.B is retained during spermiogenesis, while is mouse it disappears and H2A.L is retained instead [molaro_evolutionary_2018]. Mouse H2A.B has additional negative residue in acidic patch, which is thought to increase its propensity to compact nucleosomal arrays relative to human H2A.B.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, "taxonomic_span": "Homo sapiens", "taxonomic_span_id": "9606", "alternate_names": [ { - "name": "H2A.B.1" - }, - { - "name": "H2A.B.1.1" - }, - { - "name": "H2A.B.1.2" + "name": "H2A.Bbd" } ], "publications": [ - "el_kennani_ms_histonedb_2017", - "molaro_evolutionary_2018" + "anuar_gene_2019", + "chadwick_novel_2001", + "chew_short_2021", + "doyen_dissection_2006", + "hirano_histone_2021", + "jiang_short_2020", + "molaro_evolutionary_2018", + "soboleva_new_2017", + "soboleva_unique_2011", + "sugiyama_distinct_2014" ] }, "H2A.B_(Mus_musculus)": { "level": "variant", "description": { - "summary": "H2A.B_(Mus_musculus) is a group of three isoforms of H2A.B variant in mouse encoded by H2ab1, H2ab2 and H2ab3 genes. H2ab1 is the most studied gene and corresponds to H2A.B.3 variant. Evolution: Moreover, the ancestral loci encoding H2A.B genes relocated away from the X Chromosome to autosomes in mouse (Chr 3 and Chr 16) and rat genomes (Chr 20 and Chr 18) as determined by flanking genes, and the encoded H2A.B genes have now been deleted or have decayed beyond recognition. 
However, the rat-mouse common ancestor acquired an intact H2A.B gene in a new X-linked locus [molaro_evolutionary_2018]. Caveats: Unfortunately there is some confusion with respect to the number suffixes in the literature and between the gene names and variant names. The H2ab1 gene variant was named initially H2A.Lap1 [soboleva_unique_2011], but renamed afterwards to H2A.B.3 [soboleva_new_2017], and this name has been used afterwards [anuar_gene_2019,jiang_short_2020]. Hence we follow the established convention." + "summary": "H2A.B_(Mus_musculus) is a group of three isoforms of H2A.B variant in mouse encoded by H2ab1, H2ab2 and H2ab3 genes. H2ab1 is the most studied gene and corresponds to H2A.B.3 variant. Evolution: Moreover, the ancestral loci encoding H2A.B genes relocated away from the X Chromosome to autosomes in mouse (Chr 3 and Chr 16) and rat genomes (Chr 20 and Chr 18) as determined by flanking genes, and the encoded H2A.B genes have now been deleted or have decayed beyond recognition. However, the rat-mouse common ancestor acquired an intact H2A.B gene in a new X-linked locus [molaro_evolutionary_2018]. Caveats: Unfortunately there is some confusion with respect to the number suffixes in the literature and between the gene names and variant names. The H2ab1 gene variant was named initially H2A.Lap1 [soboleva_unique_2011], but renamed afterwards to H2A.B.3 [soboleva_new_2017], and this name has been used afterwards [anuar_gene_2019,jiang_short_2020]. 
Hence we follow the established convention.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, "taxonomic_span": "Mus musculus", "taxonomic_span_id": "10090", "alternate_names": [], "publications": [ + "anuar_gene_2019", + "jiang_short_2020", "molaro_evolutionary_2018", - "soboleva_unique_2011", "soboleva_new_2017", - "anuar_gene_2019", - "jiang_short_2020" + "soboleva_unique_2011" ] }, - "H2A.B.1_(Mus_musculus)": { - "level": "variant", + "H2A.J": { + "level": "variant_group", "description": { - "summary": "H2A.B.1_(Mus_musculus) is one of the three isoforms of H2A.B variant in mouse encoded by H2ab3 gene. Caveats: Unfortunately there is some confusion with respect to the number suffixes in the literature and between the gene names and variant names. Since a variant encoded by H2ab1 gene was named initially H2A.Lap1 [soboleva_unique_2011], but renamed afterwards to H2A.B.3 [soboleva_new_2017], and this name has been used afterwards [anuar_gene_2019,jiang_short_2020], the H2ab3 gene variant is name here as H2A.B.1." + "summary": "H2A.J is a poorly studied replication independent H2A histone variant very similar in sequence to canonical H2A histones. It was characterized in human and mouse, similar genes are present in other mammals. It has been implicated in cell senescence. Genes: In human it is encoded by H2AJ gene on chromosome 12, in mouse by H2aj gene on chromosome 6. Both genes are intronless. H2aj gene lacks a stem-loop structure at the 3'-UTR but contains a poly (A) signal [nishida_novel_2005]. Similar genes are found in other mammals [contrepois_histone_2017]. Evolution: no studies available. 
Knock-out: Depletion of H2A.J via RNA interference modifies senescence-associated chromatin re-structuring and abolishes senescence-associated secretory phenotype in human fibroblasts subject to ionizing radiation [isermann_histone_2020]. Function, disease: It has been shown that H2A.J accumulates in senescent cells and promotes inflammatory gene expression [isermann_histone_2020,contrepois_histone_2017]. Sequence: It differs from canonical H2A protein sequences only by an A11V substitution and the presence of an SQK motif near the C-terminus, which is a potential phosphorylation site [talbert_histone_2021]. Localization: In fibroblast irradiation experiments it was shown that H2A.J colocalizes with 53BP1 and is incorporated at the periphery of so-called senescence-associated heterochromatin foci (SAHF) [isermann_histone_2020]. Deposition: unclear. Structural effects: sequence changes lie only within the histone tails, alterations to the C-terminal tail may theoretically alter interactions with linker DNA and H1-histone, but this has not been studied. 
Interactions: colocalizes with 53BP1 [isermann_histone_2020].", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Mus musculus", - "taxonomic_span_id": "10090", + "taxonomic_span": "Mammalia", + "taxonomic_span_id": "40674", "alternate_names": [], "publications": [ - "soboleva_unique_2011", - "soboleva_new_2017", - "anuar_gene_2019", - "jiang_short_2020" + "25731851", + "contrepois_histone_2017", + "isermann_histone_2020", + "nishida_novel_2005", + "talbert_histone_2021" ] }, - "H2A.B.2_(Mus_musculus)": { + "H2A.J_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "H2A.B.2_(Mus_musculus) is one of the three isoforms of H2A.B variant in mouse encoded by H2ab2 gene." + "summary": "null", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Mus musculus", - "taxonomic_span_id": "10090", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], "publications": [] }, - "H2A.B.3_(Mus_musculus)": { - "level": "variant", - "description": { - "summary": "H2A.B.3_(Mus_musculus) is one of the three isoforms of H2A.B variant in mouse encoded by H2ab1 gene. This gene has been characterized the most experimentally among all H2A.B. variants. Caveats: Unfortunately there is some confusion with respect to the number suffixes in the literature and between the gene names and variant names. 
This variant was named initially H2A.Lap1 [soboleva_unique_2011], but renamed afterwards to H2A.B.3 [soboleva_new_2017], and this name has been used afterwards [anuar_gene_2019,jiang_short_2020]. Hence we follow the established convention. Caveat: Moralo et al. suggests that \"rat-mouse common ancestor acquired an intact H2A.B gene in a new X-linked locus (H2a.b.ratMouse1, also historically named H2A.B.3) [molaro_evolutionary_2018]\". Our analysis of supplementary information suggests that H2a.b.ratMouse1 is H2ab2 gene in the current nomenclature. Our analysis of sequences published by Soboleva et al. suggests that H2A.B.3 (H2A.Lap1) is H2ab1 gene and not H2ab2 [soboleva_unique_2011]." - }, - "taxonomic_span": "Mus musculus", - "taxonomic_span_id": "10090", - "alternate_names": [ - { - "name": "H2A.Lap1" - } - ], - "publications": [ - "soboleva_unique_2011", - "soboleva_new_2017", - "anuar_gene_2019", - "jiang_short_2020", - "molaro_evolutionary_2018" - ] - }, "H2A.L": { "level": "variant", "description": { - "summary": "H2A.L - is a class of short H2A variants in eutherian mammals implicated in spermatogenesis and replacement of histones with protamines. Genes: \u0421ommon ancestor of eutherian mammals encoded three H2A.L genes. These genes are usually located on X chromosome at three locations (named H2A.L.1, H2A.L.2 and H2A.L.3 by Molaro et al.) [molaro_evolutionary_2018]. Humans have two putative genes (H2AL1Q, H2AL3, located at H2A.L.1 and H2A.L.3 loci, respectively) and H2AL1MP pseudogene (located at H2A.L.2 loci has inactivating mutation in all primates). The H2AL1Q and H2AL3 genes have unusually long extensions at their 3'-ends and have not so far been detected at protein level. Mouse genome has a leneage specific expansion of H2A.L genes, encoding a total of 18 genes (15 genes on X chromosome H2a1a-H2a1o and H2al3; two genes on Y-chromosome H2al2c and H2al2b; one gene on chromosome 2 H2al2a) and two pseudogenes [molaro_evolutionary_2018]. 
At H2A.L.1 locus mouse has a pseudogene H2al1q-ps. The most studied gene in mice is H2al2a. This gene was first identified in [govin_pericentric_2007] (NCBI protein id NP_080903) and was refered to as H2AL2 or H2A.L.2 histone in the following papers. However, this gene is not located at the H2A.L.2 locus (as defined by Molaro et al.) on X-chromosome, but it is rather located on chromosome 2. A synthenic location of H2A.L.2 locus in mouse is occupied by H2al1m gene [Seal et al. unpublished]. Previous names for mouse H2A.Ls include H2A.Lap2, H2A.Lap3, H2A.Lap4, H2AL1, H2AL2 [soboleva_unique_2011, govin_pericentric_2007]. H2AL1 has been used to reffer to H2al1a gene [govin_pericentric_2007]. Evolution: Molaro et al. found that short H2A variants show greater evolutionary divergence between species than even CENPA, the fastest-evolving histone variant examined to date [molaro_evolutionary_2018]. Evolutionary analysis of purifying selection suggested that H2A.L function may have been lost in Old World monkeys and hominoids but retained in New World monkeys [molaro_evolutionary_2018]. Knock-out: H2A.L.2 knock out mice are infertile because transition proteins can no longer associate with chromatin [barral_histone_2017]. Function: Required for the histone\u2013protamine exchange process [barral_histone_2017]. Sequence: Sequence is divergent from cH2A. Identity with cH2A may be as low as 30%. H2A.L variants have a shortened C-termus, truncated docking domain, altered acidic patch, arginine rich N-terminus. Nucleosomes incorporating H2A.L warp less DNA and from more loosely packed chromatin [molaro_evolutionary_2018]. Localization: Accumulates in spermatid nuclei until the end of spermatogenesis and remains in mature sperm chromatin even after protamine exchange in mouse, eventually disappearing from the paternal pronucleus following fertilization [molaro_evolutionary_2018]. 
Involved in pericentric chromatin organization in spermatids, is retained after histone-to-protamine replacement [hoghoughi_rna-guided_2020]. H2A.L.2 is maximally expressed at later stages of spermatogenesis (condensing spermatids) when histones are bound by transition proteins and then replaced with protamines Structural effects: Interactions: H2A.L.2 preferentially dimerizes with H2B.1 (TH2B) at least in mice [govin_pericentric_2007]. Intranuclear localization of H2A.L.2 is controlled by its ability to bind RNA via its N-terminus [hoghoughi_rna-guided_2020]. Deposition: Likely mediated by interaction with RNA [hoghoughi_rna-guided_2020]. Disease: no information, since no H2A.L have been so far detect at protein level in humans. Caveats: there is some confusion in literature with respect to numbering H2A.L subvariants, especially in mouse (see caveats in description of mouse H2A.L variants)." + "summary": "H2A.L - is a class of short H2A variants in eutherian mammals implicated in spermatogenesis and replacement of histones with protamines. Genes: Common ancestor of eutherian mammals encoded three H2A.L genes. These genes are usually located on X chromosome at three locations (named H2A.L.1, H2A.L.2 and H2A.L.3 by Molaro et al.) [molaro_evolutionary_2018]. Humans have two putative genes (H2AL1Q, H2AL3, located at H2A.L.1 and H2A.L.3 loci, respectively) and H2AL1MP pseudogene (located at H2A.L.2 loci has inactivating mutation in all primates). The H2AL1Q and H2AL3 genes have unusually long extensions at their 3'-ends and have not so far been detected at protein level. Mouse genome has a lineage-specific expansion of H2A.L genes, encoding a total of 18 genes (15 genes on X chromosome H2al1a-H2al1o and H2al3; two genes on Y-chromosome H2al2c and H2al2b; one gene on chromosome 2 H2al2a) and two pseudogenes [molaro_evolutionary_2018]. At H2A.L.1 locus mouse has a pseudogene H2al1q-ps. The most studied gene in mice is H2al2a.
This gene was first identified in [govin_pericentric_2007] (NCBI protein id NP_080903) and was referred to as H2AL2 or H2A.L.2 histone in the following papers. However, this gene is not located at the H2A.L.2 locus (as defined by Molaro et al.) on X-chromosome, but it is rather located on chromosome 2. A syntenic location of H2A.L.2 locus in mouse is occupied by H2al1m gene [Seal et al. unpublished]. Previous names for mouse H2A.Ls include H2A.Lap2, H2A.Lap3, H2A.Lap4, H2AL1, H2AL2 [soboleva_unique_2011,govin_pericentric_2007]. H2AL1 has been used to refer to H2al1a gene [govin_pericentric_2007]. Evolution: Molaro et al. found that short H2A variants show greater evolutionary divergence between species than even CENPA, the fastest-evolving histone variant examined to date [molaro_evolutionary_2018]. Evolutionary analysis of purifying selection suggested that H2A.L function may have been lost in Old World monkeys and hominoids but retained in New World monkeys [molaro_evolutionary_2018]. Knock-out: H2A.L.2 knock out mice are infertile because transition proteins can no longer associate with chromatin [barral_histone_2017]. Function: Required for the histone\u2013protamine exchange process [barral_histone_2017]. Sequence: Sequence is divergent from cH2A. Identity with cH2A may be as low as 30%. H2A.L variants have a shortened C-terminus, truncated docking domain, altered acidic patch, arginine-rich N-terminus. Nucleosomes incorporating H2A.L wrap less DNA and form more loosely packed chromatin [molaro_evolutionary_2018]. Localization: Accumulates in spermatid nuclei until the end of spermatogenesis and remains in mature sperm chromatin even after protamine exchange in mouse, eventually disappearing from the paternal pronucleus following fertilization [molaro_evolutionary_2018]. Involved in pericentric chromatin organization in spermatids, is retained after histone-to-protamine replacement [hoghoughi_rna-guided_2020].
H2A.L.2 is maximally expressed at later stages of spermatogenesis (condensing spermatids) when histones are bound by transition proteins and then replaced with protamines. Structural effects: Interactions: H2A.L.2 preferentially dimerizes with H2B.1 (TH2B) at least in mice [govin_pericentric_2007]. Intranuclear localization of H2A.L.2 is controlled by its ability to bind RNA via its N-terminus [hoghoughi_rna-guided_2020]. Deposition: Likely mediated by interaction with RNA [hoghoughi_rna-guided_2020]. Disease: no information, since no H2A.L have been so far detected at protein level in humans. Caveats: there is some confusion in literature with respect to numbering H2A.L subvariants, especially in mouse (see caveats in description of mouse H2A.L variants).", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, "taxonomic_span": "Eutheria", "taxonomic_span_id": "9347", @@ -1220,11 +2762,11 @@ }, { "name": "H2AL1", - "gene": 1 + "gene": "1" }, { "name": "H2AL2", - "gene": 2 + "gene": "2" }, { "name": "H2A.Lap2" @@ -1234,218 +2776,148 @@ } ], "publications": [ - "22650316", - "25731851", - "19506029", + " govin_pericentric_2007", "17261847", "18703863", - "molaro_evolutionary_2018", + "19506029", + "22650316", + "25731851", + "barral_histone_2017", "govin_pericentric_2007", + "hoghoughi_rna-guided_2020", + "molaro_evolutionary_2018", "Seal et al. unpublished", - "soboleva_unique_2011", - " govin_pericentric_2007", - "barral_histone_2017", - "hoghoughi_rna-guided_2020" + "soboleva_unique_2011" ] }, - "H2A.L_(Homo_sapiens)": { - "level": "variant", - "description": { - "summary": "H2A.L_(Homo_sapiens) - is a class of putative H2A.L histone variants in human.
Humans have two putative genes (H2AL1Q, H2AL3, located at H2A.L.1 and H2A.L.3 loci, respectively) and H2AL1MP pseudogene (located at H2A.L.2 loci has inactivating mutation in all primates). The H2AL1Q and H2AL3 genes have unusually long extensions at their 3'-ends and have not so far been detected at protein level. See H2A.L description for more information." - }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", - "alternate_names": [], - "publications": [] - }, "H2A.L.1_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "H2A.L.1_(Homo_sapiens) - is a putative H2A.L histone variant encoded by H2AL1Q gene. It is located at H2A.L.1 locus on X-chromosome which can be traced back to the common ancestor of eutherian mammanls. The H2AL1Q and H2AL3 genes have unusually long extensions at their 3'-ends and have not so far been detected at protein level. See H2A.L description for more information." - }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", - "alternate_names": [], - "publications": [] - }, - "H2A.L.3_(Homo_sapiens)": { - "level": "variant", - "description": { - "summary": "H2A.L.3_(Homo_sapiens) - is a putative H2A.L histone variant encoded by H2AL3 gene. It is located at H2A.L.3 locus on X-chromosome which can be traced back to the common ancestor of eutherian mammanls. The H2AL1Q and H2AL3 genes have unusually long extensions at their 3'-ends and have not so far been detected at protein level. See H2A.L description for more information." + "summary": "H2A.L.1_(Homo_sapiens) - is a putative H2A.L histone variant encoded by H2AL1Q gene. It is located at H2A.L.1 locus on X-chromosome which can be traced back to the common ancestor of eutherian mammanls. The H2AL1Q and H2AL3 genes have unusually long extensions at their 3'-ends and have not so far been detected at protein level. 
See H2A.L description for more information.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, "taxonomic_span": "Homo sapiens", "taxonomic_span_id": "9606", "alternate_names": [], "publications": [] }, - "H2A.L_(Mus_musculus)": { - "level": "variant", - "description": { - "summary": "H2A.L_(Mus_musculus) - is a group of H2A.L histone variants in mouse. The single autosomal H2al2a (H2A.L.2 variant) gene in mouse located on chromosome 2 is expressed at much higher levels than the sex-linked copies; knockout of this single gene is sufficient to cause male sterility [molaro_evolutionary_2018]. See H2A.L description for more information. Caveats: there is some confusion with the variant names in the literature. Govin et al. initially identified and named three variants H2AL1, H2AL2, H2AL3 [govin_pericentric_2007]. These are encoded by H2al1a, H2al2a and H2ap genes, respectively. The H2Al2 endoded variant was later renamed in the literature as H2A.L.2 [jiang_short_2020]. The H2ap gencoded variant is in fact H2A.P in the current nomenclature. Alternatively, Molaro et al. have named three evolutionary conserved loci on X chromosome that harbor H2A.L genes, these loci are H2A.L.1, H2A.L.2 and H2A.L.3 [molaro_evolutionary_2018]. While human gene and variant naming is in line with the names of these loci, in mouse names of these loci do not correspond exactly to the originally proposed gene names except for H2A.L.3 locus which harbors H2al3 gene (not H2ap gene(!)). 
In mouse at H2A.L.1 locus a pseudogene H2al1q-ps is located, at H2A.L.2 locus mouse has H2al1m gene (H2al1a-H2al1o genes located within 5 megabases from this locus have similar protein sequences(?)), while H2A.L.2 variant encoded by H2al2a is located on chromosome 2 (two similar genes H2al2b and H2al2c are located on Y chromosome). In this classification we follow the numbering used in gene names which also corresponds to the one established earlier in the literature. Hence, H2A.L.2 variant in mouse encompasses H2al2a gene and similar H2al2b and H2al2c genes, while H2A.L.1 variant encompasses 14 H2al1a-H2al1o genes including H2al1m gene located at a syntenic location of the H2A.L.2 locus" - }, - "taxonomic_span": "Mus musculus", - "taxonomic_span_id": "10090", - "alternate_names": [], - "publications": [ - "molaro_evolutionary_2018", - "govin_pericentric_2007", - "jiang_short_2020" - ] - }, "H2A.L.1_(Mus_musculus)": { "level": "variant", "description": { - "summary": "H2A.L.1_(Mus_musculus) - is a group of H2A.L histone variants in mouse endoded by 14 genes on X-chromosome (H2al1a,H2al1b,H2al1c,H2al1d,H2al1e,H2al1f,H2al1g,H2al1h,H2al1i,H2al1j,H2al1k,H2al1m,H2al1n,H2al1o). See H2A.L description for more information. El Kennani et al. reported variations in expression of different H2A.L.1 genes between different stages of spermatogenesis in mice [el_kennani_ms_histonedb_2017]." - }, - "taxonomic_span": "Mus musculus", - "taxonomic_span_id": "10090", - "alternate_names": [], - "publications": [ - "el_kennani_ms_histonedb_2017" - ] - }, - "H2A.L.2_(Mus_musculus)": { - "level": "variant", - "description": { - "summary": "H2A.L.2_(Mus_musculus) - is a group of H2A.L histone variants in mouse endoded by H2al2a gene on chromosome 2 and two related H2al2b, H2al2b genes on Y-chromosome. H2al2a gene reffered in literature as H2A.L.2 variant is the most studied one, demostrating higher levels of expression than other H2A.L genes in mouse. 
See H2A.L description for more information. " - }, - "taxonomic_span": "Mus musculus", - "taxonomic_span_id": "10090", - "alternate_names": [], - "publications": [] - }, - "H2A.L.3_(Mus_musculus)": { - "level": "variant", - "description": { - "summary": "H2A.L.3_(Mus_musculus) - is a H2A.L histone variant in mouse endoded by H2al3 gene on X chromosome. Its ortolog at a conserved position in humans is H2AL3 gene. See H2A.L description for more information." - }, - "taxonomic_span": "Mus musculus", - "taxonomic_span_id": "10090", - "alternate_names": [], - "publications": [] - }, - "H2A.P": { - "level": "variant", - "description": { - "summary": "H2A.P - is a class of testis-specific short H2A variants in eutherian mammals expressed at post-meiotic stages of spermatogensis. It is not well studied. Its expression in mouse has been shown only at mRNA level [el_kennani_ms_histonedb_2017], although evolutionary analysis strongly argues that it is a protein coding gene [molaro_evolutionary_2018]. In human H2A.P gene H2ap was previously named HYPM (Huntingtin-interacting protein M) since in yeast two-hybrid experiments it was shown to interact with huntingtin, which contains an expanded polyglutamine tract in individuals with Huntington's disease [faber_huntingtin_1998]. Genes: \u0421ommon ancestor of eutherian mammals encoded a single H2A.P gene. These genes are usually located on X chromosome as do other short H2As [molaro_evolutionary_2018]. Humans and mouse have one gene name H2AP and H2ap, respectively. Evolution: Molaro et al. found that short H2A variants show greater evolutionary divergence between species than even CENPA, the fastest-evolving histone variant examined to date. Their results indicate that H2A.P and possible H2A.B have been subject to diversifying selection in simian primates, which could partly ecplame the greater divergence of short H2A histone variants compared to other H2A histones in mammals [molaro_evolutionary_2018]. Knock-out: no studies. 
Function: no specific studies have been reported, but by its similarity to H2A.L it is likely that it participates in the histone\u2013protamine exchange process. Sequence: Has one of the most divergent sequences from cH2A. Identity with cH2A may be as low as 24%. H2A.P variants have a shortened C-termus, truncated docking domain, altered acidic patch, arginine rich N-terminus. H2A.P have lost two key conserved arginine (R) residues in Loop 1 and 2 that contact the DNA minor-groove and acquired many acidic residues at sites including contacts with DNA and H2B. The last 14 residues in H2A.P are more evolutionary contrained than the rest of the protein, suggesting their potential interaction with non-histone proteins. Localization: H2A.P presence has not been confirmed at protein level. H2A.P mRNA were found to be strongly enriched in round and elongating spermatids [govin_pericentric_2007], expressed in the post-meiotic stages of spermatogenesis [el_kennani_ms_histonedb_2017]. Structural effects: Nucleosomes incorporating H2A.P are predicted to be highly destabilized [molaro_evolutionary_2018]. Interactions: In yeast two-hybrid screens was shown to interact with huntingtin [faber_huntingtin_1998]. Disease: no information. Caveats: H2A.P in mice was previously name H2AL3 [govin_pericentric_2007] and H2A.Lap4 [soboleva_unique_2011]." - }, - "taxonomic_span": "Eutheria", - "taxonomic_span_id": "9347", - "alternate_names": [], - "publications": [ - "9700202", - "el_kennani_ms_histonedb_2017", - "molaro_evolutionary_2018", - "faber_huntingtin_1998", - "govin_pericentric_2007", - "soboleva_unique_2011" - ] - }, - "H2A.P_(Homo_sapiens)": { - "level": "variant", - "description": { - "summary": "H2A.P_(Homo_sapiens) - is a H2A.P variant histone encoded in humans by H2AP gene. See H2A.P variant description for more information. 
In human H2A.P gene H2ap was previously named HYPM (Huntingtin-interacting protein M) since in yeast two-hybrid experiments it was shown to interact with huntingtin, which contains an expanded polyglutamine tract in individuals with Huntington's disease [faber_huntingtin_1998]." - }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", - "alternate_names": [], - "publications": [ - "9700202", - "faber_huntingtin_1998" - ] - }, - "H2A.P_(Mus_musculus)": { - "level": "variant", - "description": { - "summary": "H2A.P_(Mus_musculus) - is a H2A.P variant histone encoded in humans by H2ap gene. See H2A.P variant description for more information. Caveats: H2A.P in mice was previously name H2AL3 [govin_pericentric_2007] and H2A.Lap4 [soboleva_unique_2011]." + "summary": "H2A.L.1_(Mus_musculus) - is a group of H2A.L histone variants in mouse endoded by 14 genes on X-chromosome (H2al1a,H2al1b,H2al1c,H2al1d,H2al1e,H2al1f,H2al1g,H2al1h,H2al1i,H2al1j,H2al1k,H2al1m,H2al1n,H2al1o). See H2A.L description for more information. El Kennani et al. reported variations in expression of different H2A.L.1 genes between different stages of spermatogenesis in mice [el_kennani_ms_histonedb_2017].", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, "taxonomic_span": "Mus musculus", "taxonomic_span_id": "10090", "alternate_names": [], "publications": [ - "govin_pericentric_2007", - "soboleva_unique_2011" + "el_kennani_ms_histonedb_2017" ] }, - "H2A.Q": { + "H2A.L.2_(Mus_musculus)": { "level": "variant", "description": { - "summary": "H2A.Q - is a short H2A variant present in many eutherian mammalian genomes at a distinct syntenic location. 
It is not well studied and has only been identified via bioinformatics approaches [molaro_evolutionary_2018]. Human and mouse does not have functional H2A.Q genes, there is a pseudogene in human, named H2AQ1P, Molaro et al. also lists coordinates for mouse pseudogene (mm10, chrX, 59012618-59012929). No expression of H2A.Q in primates has been also found and evolutionary analysis cannot confirm the presence of purifying selection for the respective genes. Like other intact short H2A genes, dog and pig H2A.Q genes are transcribed in testes but are undetectable in other tissues examined, including ovary [molaro_evolutionary_2018]. While tails of H2A.B and H2A.L are similar, they differ significantly from H2A.P and H2A.Q , suggesting that short histone H2A variants do not share the same function given the importance of the N-terminal tails in regulating nucleosome function [jiang_short_2020]. H2A.Q histone variants have variable N-terminus, truncated histone fold domain of variable length and altered acidic patch [molaro_evolutionary_2018]." - }, - "taxonomic_span": "Eutheria", - "taxonomic_span_id": "9347", - "alternate_names": [], - "publications": [ - "molaro_evolutionary_2018", - "jiang_short_2020" - ] - }, - "H2A.R": { - "level": "variant_group", - "description": { - "summary": "H2A.R - is a histone variant found currently in monotremes and marsupials, it is an intermediate between the eutherian short histone H2A variants and canonical H2A. Evolutionary analysis suggests that ancestor histone H2A variant branched out to H2A.R (still possessing a C-terminus) in monotremes and marsupials, and to the four classes of the short histone H2A variants in eutherian mammals. H2A.R histone variants have variable N-terminus, altered charge of the histone fold domain, divergent L1-loop, altered acidic patch and extended C-terminal tail. Platypus and opossum H2A.R variants are expressed in the testis but not in other tissues we examined, including opossum ovary. Molaro et al. 
concluded that expression analysis allows to infer that testis-specific expression preceded the divergence of H2A.R and eutherian short histone H2A variants and is a common feature of all these genes. It is currently unclear whether the common ancestor of H2A.R and the short H2As was autosomal or sex chromosome-linked [molaro_evolutionary_2018]." + "summary": "H2A.L.2_(Mus_musculus) - is a group of H2A.L histone variants in mouse encoded by H2al2a gene on chromosome 2 and two related H2al2b, H2al2c genes on Y-chromosome. H2al2a gene referred to in the literature as H2A.L.2 variant is the most studied one, demonstrating higher levels of expression than other H2A.L genes in mouse. See H2A.L description for more information.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Mammalia", - "taxonomic_span_id": "40674", + "taxonomic_span": "Mus musculus", + "taxonomic_span_id": "10090", "alternate_names": [], - "publications": [ - "molaro_evolutionary_2018" - ] + "publications": [] }, - "H2A.J": { - "level": "variant_group", + "H2A.L.3_(Homo_sapiens)": { + "level": "variant", "description": { - "summary": "H2A.J is a poorly studied replication independent H2A histone variant very similar in sequence to canonical H2A histones. It was characterized in human and mouse, similar genes are present in other mammals. It has been implicated in cell senesecence. Genes: In human it is encoded by H2AJ gene on chormomosome 12, in mouse by H2aj gene on chromosome 6. Both genes are intronless. H2aj gene lacks a stem-loop structure at the 3'-UTR but contains a poly (A) signal [nishida_novel_2005]. Similar genes are found in other mammals [contrepois_histone_2017]. Evolution: no studies available.
Knock-out: Depletion of H2A.J via RNA interference modifies senesecence-associated chromatin re-structuring and abolishes senesecence-associated secretory phenotype in human fibroblasts subject to ionizing radiation [isermann_histone_2020]. Function, disease: It has been shown that H2A.J accumulates in senescent cells and promotes inflammatory gene expression [isermann_histone_2020,contrepois_histone_2017]. Sequence: It differs from canonical H2A protein sequences only by an A11V substitution and the presence of an SQK motif near the C-terminus, which is a potential phosphorylation site [talbert_histone_2021]. Localization: In fibroblast irradiation experiments it was shown that H2A.J colocalizes with 53BP1 and is incorporated at the periphery of so-called senesecence-associated chromatin foci (SAHF) [isermann_histone_2020]. Deposition: unclear. Structural effects: sequence changes lie only within the histone tails, alterations to the C-terminal tail may theoretically alter interactions with linker DNA and H1-histone, but this has not been studied. Interactions: colocalizes with 53BP1 [isermann_histone_2020]." + "summary": "H2A.L.3_(Homo_sapiens) - is a putative H2A.L histone variant encoded by H2AL3 gene. It is located at H2A.L.3 locus on X-chromosome which can be traced back to the common ancestor of eutherian mammanls. The H2AL1Q and H2AL3 genes have unusually long extensions at their 3'-ends and have not so far been detected at protein level. 
See H2A.L description for more information.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" }, - "taxonomic_span": "Mammalia", - "taxonomic_span_id": "40674", + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", "alternate_names": [], - "publications": [ - "25731851", - "nishida_novel_2005", - "contrepois_histone_2017", - "isermann_histone_2020", - "talbert_histone_2021" - ] + "publications": [] }, - "H2A.W": { - "level": "variant_group", + "H2A.L.3_(Mus_musculus)": { + "level": "variant", "description": { - "summary": "H2A.W is a plant specific variant found in angiosperms (flowering plants) having a potentially DNA minor-groove-binding SPKK (sometime reffered to as KSPKKA) motif within its C-terminal tail, it is enriched in heterochromatin and implicated in gene silencing and DNA damage response.", - "taxonomy": "H2A.W variant is found exclusively in angiosperms [alvarez-venegas_canonical_2019].", - "genes": "Arabidopsis has three H2A.W genes (HTA6, HTA7, and HTA12) endoding three isoforms, rice genome has four genes (HTA701, HTA706, HTA707, and HTA710) encoding three isoforms. Isoforms endoded by different genes may have different number of SPKK motifs. A single copy of the SPKK motif seems to be true for all eudicots, whereas the monocots have been shown to possess 2 or even 3 copies of the same motif [alvarez-venegas_canonical_2019,kawashima_diversification_2015].", - "evolution": "H2A.W is a plant-lineage-specific variant that may have arisen early in the evolution of spermatophytes or seed plants. 
H2A.W lacks homologs in unicellular green algae, liverworts, mosses, and lycophytes but has distinctive homologs in early spermatophytes from the genus Ginkgo, Cycas, and Gnetum [alvarez-venegas_canonical_2019,kawashima_diversification_2015]. Instead of H2A.W homologs, Kawashima et al. identified a novel group of related H2A variants, they named H2A.M, in the genomes of liverworts, mosses, and lycophytes [kawashima_diversification_2015]. Whether H2A.M and H2A.W emerged from the same ancestor or H2A.M in early basal land plants evolved gradually to become H2A.W in seed plants remains undetermined [alvarez-venegas_canonical_2019,kawashima_diversification_2015].", - "expression": "In Arabidopsis HTA6 and HTA7 were found to have S-phase specific expression during the cell cycle, while H2A12 did not manifest any specific cell-cycle expression peak [alvarez-venegas_canonical_2019,menges_genome-wide_2003].", - "knock-out:": "In Arabidopsis single mutants of H2A.W genes do not dispay any phenotype; double mutants, HtA6 HTA7 and HTA6 HTA12, and triple mutants result in growth defects that were even more severe in the triple mutant. This suggests that the three H2A.W paralogs in Arabidopsis are functionally redundant [alvarez-venegas_canonical_2019,yelagandula_histone_2014]. HTA7 knock-out in Arabidopsis results in sensitivity to genotoxic agents [lorkovic_compartmentalization_2017].", - "function": "H2A.W participates in constitutive heterochromatin formation, particularly pericentric heterochromatin [yelagandula_histone_2014]. H2A.W.7 (HTA7 gene) in Arabidopsis was shown to be involved in DNA damage response. It contains an SQ motif within C-terminal tail, which is phosphorylated by ATM kinase upon DNA damage [lorkovic_compartmentalization_2017].", - "sequence": "A characteristic feature of H2A.W sequences is the presence of one or multiple SPKK motifs within its long C-terminal tail. 
The SPKK motif was reported to preferentially bind AT-rich DNA, which is a feature of pericentric heterochromatin occupied by H2A.W in Arabidopsis [churchill_spkk_1989]. H2A.W variants also have significant sequence alerations within L1-loop and docking domain, which influence nucleosome stability [osakabe_histone_2018]. L1-loop of flowering plants contains (RYA/SK/Q) motif [kawashima_diversification_2015].", - "localization": "Genome-wide analysis showed that H2A.W variants localize with heterochromatin, transposable elements, H3K9me2-rich regions [yelagandula_histone_2014].", - "deposition": "Specific deposition mechanism are not known. Certain H2A.W are desposited during S-phase in a replication-dependent manner, while others manifest replication-independent deposition [alvarez-venegas_canonical_2019].", - "structure": "The extended C-terminal tail of H2A.W interacts with linker DNA and protects DNA from the cleavage by MNase [osakabe_histone_2018]. H2A.W may facilitate heterochromatin formation by promoting long-range interactions between nucleosomes, an activity that requires the long C-terminal tail domain containing a SPKK motif [alvarez-venegas_canonical_2019,yelagandula_histone_2014]. Replacement of H2A.W L1-loop with the corresponding sequence from H2A does not affect nucleosome stability [osakabe_histone_2018].", - "interactions": "It was hypothesized that C-terminal tail of H2A.W may impact H1 binding [osakabe_histone_2018].", + "summary": "H2A.L.3_(Mus_musculus) - is a H2A.L histone variant in mouse endoded by H2al3 gene on X chromosome. Its ortolog at a conserved position in humans is H2AL3 gene. 
See H2A.L description for more information.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", "disease": "null", "caveats": "null" }, - "taxonomic_span": "Magnoliopsida", - "taxonomic_span_id": "3398", - "alternate_names": [ - { - "name": "H2A with SPKK motifs" - } - ], + "taxonomic_span": "Mus musculus", + "taxonomic_span_id": "10090", + "alternate_names": [], "publications": [] }, - "H2A.M": { - "level": "variant_group", + "H2A.L_(Homo_sapiens)": { + "level": "variant", "description": { - "summary": "H2A.M is a plant specific variant related to H2A.W found in non-flowering plants such as liverworts, mosses, and lycophytes. H2A.M variants are characterized by having a long C-terminal tail domain, rich in lysine, serine and acidic residues, not present in the other H2A variants. The variant was described by Kawashima et al. [kawashima_diversification_2015].", - "taxonomy": "H2A.M was characterized in genomes of liverworts, mosses, and lycophytes[kawashima_diversification_2015].", + "summary": "H2A.L_(Homo_sapiens) - is a class of putative H2A.L histone variants in human. Humans have two putative genes (H2AL1Q, H2AL3, located at H2A.L.1 and H2A.L.3 loci, respectively) and H2AL1MP pseudogene (located at H2A.L.2 loci has inactivating mutation in all primates). The H2AL1Q and H2AL3 genes have unusually long extensions at their 3'-ends and have not so far been detected at protein level. See H2A.L description for more information.", + "taxonomy": "null", "genes": "null", - "evolution": "Certain similarities between the C-terminal tail and the L1-loop of H2A.M and H2A.W variants and the clustering of H2A.M and H2A.W proteins in the phylogeny of H2A suggest that these two variants are related. 
Whether H2A.M and H2A.W emerged from the same ancestor or H2A.M in early basal land plants evolved gradually to become H2A.W in seed plants remains undetermined [alvarez-venegas_canonical_2019,kawashima_diversification_2015].", + "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", - "sequence": "In the L1 loop, all H2A.M variants share the motif RYAK/Q. The N-terminal tails of H2A.Ms lack a stretch of lysine and glycine residues that is present in H2A.W variants, and are therefore shorter [kawashima_diversification_2015].", + "sequence": "null", "localization": "null", "deposition": "null", "structure": "null", @@ -1453,23 +2925,21 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Viridiplantae", - "taxonomic_span_id": "33090", + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", "alternate_names": [], - "publications": [ - "kawashima_diversification_2015" - ] + "publications": [] }, - "gH2A": { - "level": "variant_group", + "H2A.L_(Mus_musculus)": { + "level": "variant", "description": { - "summary": "gH2A is a male-gamete-specific variant found in the genus Lilium [alvarez-venegas_canonical_2019,ueda_male_2005].", - "taxonomy": "Suggested to be a distinctive variant that evloved specifically in Lilium [alvarez-venegas_canonical_2019]", - "genes": "gH2A gene in Lilium longiflorum. The gene is interrupted by one intron.", + "summary": "H2A.L_(Mus_musculus) - is a group of H2A.L histone variants in mouse. The single autosomal H2al2a (H2A.L.2 variant) gene in mouse located on chromosome 2 is expressed at much higher levels than the sex-linked copies; knockout of this single gene is sufficient to cause male sterility [molaro_evolutionary_2018]. See H2A.L description for more information. Caveats: there is some confusion with the variant names in the literature. Govin et al. initially identified and named three variants H2AL1, H2AL2, H2AL3 [govin_pericentric_2007]. 
These are encoded by H2al1a, H2al2a and H2ap genes, respectively. The H2al2a-encoded variant was later renamed in the literature as H2A.L.2 [jiang_short_2020]. The H2ap-encoded variant is in fact H2A.P in the current nomenclature. Alternatively, Molaro et al. have named three evolutionarily conserved loci on X chromosome that harbor H2A.L genes, these loci are H2A.L.1, H2A.L.2 and H2A.L.3 [molaro_evolutionary_2018]. While human gene and variant naming is in line with the names of these loci, in mouse names of these loci do not correspond exactly to the originally proposed gene names except for H2A.L.3 locus which harbors H2al3 gene (not H2ap gene(!)). In mouse at H2A.L.1 locus a pseudogene H2al1q-ps is located, at H2A.L.2 locus mouse has H2al1m gene (H2al1a-H2al1o genes located within 5 megabases from this locus have similar protein sequences(?)), while H2A.L.2 variant encoded by H2al2a is located on chromosome 2 (two similar genes H2al2b and H2al2c are located on Y chromosome). In this classification we follow the numbering used in gene names which also corresponds to the one established earlier in the literature. 
Hence, H2A.L.2 variant in mouse encompasses H2al2a gene and similar H2al2b and H2al2c genes, while H2A.L.1 variant encompasses 14 H2al1a-H2al1o genes including H2al1m gene located at a syntenic location of the H2A.L.2 locus", + "taxonomy": "null", + "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", - "function": "This histone variant is expected to be specifically synthesized in the male gametic cells and to cause chromatin condensation or remodeling of chromatin structure [ueda_male_2005].", + "knock-out": "null", + "function": "null", "sequence": "null", "localization": "null", "deposition": "null", @@ -1478,25 +2948,26 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Lilium", - "taxonomic_span_id": "4688", + "taxonomic_span": "Mus musculus", + "taxonomic_span_id": "10090", "alternate_names": [], "publications": [ - "alvarez-venegas_canonical_2019", - "ueda_male_2005" + "govin_pericentric_2007", + "jiang_short_2020", + "molaro_evolutionary_2018" ] }, - "H2B": { - "level": "type", + "H2A.M": { + "level": "variant_group", "description": { - "summary": "H2B is one of the core histone types present in all Eukaryotes. H2B forms dimers with H2A via the \"hand shake\" motif. Two H2A-H2B dimers in turn associate with H3-H4 tetramer to form complete nucleosome core. It has been suggested that H2A and H2B have arisen from H3 and H4 during evolution [malik_phylogenomics_2003]. Structure of H2B consists of a histone fold with a long flexible N-terminal tail which protrudes between the DNA gyres. H2B interacts with H4 in the nucleosome core via a four helix bundle motif. Addtional \u03b1C-helix of H2B decorates the surface of nucleosome. Unlike, H3 and H2A histone, H2B histones have relatively modest number of characterized histone variants. 
Although in plants, histone H2Bs have undergone significant sequence divergence and expansion in the number of encoding genes [jiang_evolution_2020].", - "taxonomy": "Present in all Eukaryotes.", + "summary": "H2A.M is a plant specific variant related to H2A.W found in non-flowering plants such as liverworts, mosses, and lycophytes. H2A.M variants are characterized by having a long C-terminal tail domain, rich in lysine, serine and acidic residues, not present in the other H2A variants. The variant was described by Kawashima et al. [kawashima_diversification_2015].", + "taxonomy": "H2A.M was characterized in genomes of liverworts, mosses, and lycophytes[kawashima_diversification_2015].", "genes": "null", - "evolution": "It has been suggested that H2A and H2B have arisen from H3 and H4 during evolution [malik_phylogenomics_2003]. The eukaryotic H3-H4 tetramer resembles the tetramer found in Archaea, and it has been suggested that H2A and H2B have arisen from H3 and H4 later on in histone evolution [henneman_structure_2018]. The histone H2B (HTB) family shows the least conservation of all core histones likely because it is less evolutionarily constrained than its counterparts [alvarez-venegas_canonical_2019].", + "evolution": "Certain similarities between the C-terminal tail and the L1-loop of H2A.M and H2A.W variants and the clustering of H2A.M and H2A.W proteins in the phylogeny of H2A suggest that these two variants are related. Whether H2A.M and H2A.W emerged from the same ancestor or H2A.M in early basal land plants evolved gradually to become H2A.W in seed plants remains undetermined [alvarez-venegas_canonical_2019,kawashima_diversification_2015].", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", - "sequence": "null", + "sequence": "In the L1 loop, all H2A.M variants share the motif RYAK/Q. 
The N-terminal tails of H2A.Ms lack a stretch of lysine and glycine residues that is present in H2A.W variants, and are therefore shorter [kawashima_diversification_2015].", "localization": "null", "deposition": "null", "structure": "null", @@ -1504,23 +2975,22 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Eukaryota", - "taxonomic_span_id": "2759", + "taxonomic_span": "Viridiplantae", + "taxonomic_span_id": "33090", "alternate_names": [], "publications": [ - "malik_phylogenomics_2003", - "jiang_evolution_2020" + "kawashima_diversification_2015" ] }, - "cH2B": { - "level": "variant_group", + "H2A.P": { + "level": "variant", "description": { - "summary": "cH2B -- canonical H2B histones. Like cH2A, this is a loosely defined group that encompasses major H2B histone proteins that are expressed during S-phase of the cell cycle in eukaryotes and are highly conserved even between distantly related species. Such proteins are often called replication dependent (RD) or \"bulk\" histones [marzluff_metabolism_2008,talbert_histone_2021]. They are likely similar to the original H2B histones of the last common ancestor of eukaryotes [malik_phylogenomics_2003]. Expression of cH2Bs during S-phase is often tightly regulated, but mechanisms may differ among kindoms [marzluff_birth_2017,pontarotti_long-term_2009]. These histones are often present as large multigene families. However, there are known limitations to the definition given above. Functional diversification of paralogous genes is a common process in evolution -- in many species multiple copies of canonical histone genes have undergone diversification in terms of sequence variation, cell-cycle or tissue-specific expression patterns. Sometimes this diversification is very subtle and species-specific (e.g. cH2B.E isoforms in mouse), in other cases there may be a spectrum of canonical-like proteins (e.g. plant canonical H2Bs which show higher sequence diversity than cH2Bs of animals). 
Hence, whether a particular gene should be regarded as a canonical, a bona fide variant or a canonical subvariant/isoform may be a matter of debate and definition in each particular case. Within the current hierarchical classification system, additional information about the cH2A class may be gained by looking at the description of its subclasses.", - "taxonomy": "Present in all Eukaryotes.", + "summary": "H2A.P - is a class of testis-specific short H2A variants in eutherian mammals expressed at post-meiotic stages of spermatogensis. It is not well studied. Its expression in mouse has been shown only at mRNA level [el_kennani_ms_histonedb_2017], although evolutionary analysis strongly argues that it is a protein coding gene [molaro_evolutionary_2018]. In human H2A.P gene H2ap was previously named HYPM (Huntingtin-interacting protein M) since in yeast two-hybrid experiments it was shown to interact with huntingtin, which contains an expanded polyglutamine tract in individuals with Huntington's disease [faber_huntingtin_1998]. Genes: \u0421ommon ancestor of eutherian mammals encoded a single H2A.P gene. These genes are usually located on X chromosome as do other short H2As [molaro_evolutionary_2018]. Humans and mouse have one gene name H2AP and H2ap, respectively. Evolution: Molaro et al. found that short H2A variants show greater evolutionary divergence between species than even CENPA, the fastest-evolving histone variant examined to date. Their results indicate that H2A.P and possible H2A.B have been subject to diversifying selection in simian primates, which could partly ecplame the greater divergence of short H2A histone variants compared to other H2A histones in mammals [molaro_evolutionary_2018]. Knock-out: no studies. Function: no specific studies have been reported, but by its similarity to H2A.L it is likely that it participates in the histone\u2013protamine exchange process. Sequence: Has one of the most divergent sequences from cH2A. 
Identity with cH2A may be as low as 24%. H2A.P variants have a shortened C-terminus, truncated docking domain, altered acidic patch, arginine rich N-terminus. H2A.P have lost two key conserved arginine (R) residues in Loop 1 and 2 that contact the DNA minor-groove and acquired many acidic residues at sites including contacts with DNA and H2B. The last 14 residues in H2A.P are more evolutionarily constrained than the rest of the protein, suggesting their potential interaction with non-histone proteins. Localization: H2A.P presence has not been confirmed at protein level. H2A.P mRNAs were found to be strongly enriched in round and elongating spermatids [govin_pericentric_2007], expressed in the post-meiotic stages of spermatogenesis [el_kennani_ms_histonedb_2017]. Structural effects: Nucleosomes incorporating H2A.P are predicted to be highly destabilized [molaro_evolutionary_2018]. Interactions: In yeast two-hybrid screens was shown to interact with huntingtin [faber_huntingtin_1998]. Disease: no information. Caveats: H2A.P in mice was previously named H2AL3 [govin_pericentric_2007] and H2A.Lap4 [soboleva_unique_2011].", + "taxonomy": "null", "genes": "null", - "evolution": "It has been suggested that H2A and H2B have arisen from H3 and H4 during evolution [malik_phylogenomics_2003]. 
The eukaryotic H3-H4 tetramer resembles the tetramer found in Archaea, and it has been suggested that H2A and H2B have arisen from H3 and H4 later on in histone evolution [henneman_structure_2018].", + "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1530,26 +3000,27 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Eukaryota", - "taxonomic_span_id": "2759", + "taxonomic_span": "Eutheria", + "taxonomic_span_id": "9347", "alternate_names": [], "publications": [ - "marzluff_metabolism_2008", - "talbert_histone_2021", - "malik_phylogenomics_2003", - "marzluff_birth_2017", - "pontarotti_long-term_2009" + "9700202", + "el_kennani_ms_histonedb_2017", + "faber_huntingtin_1998", + "govin_pericentric_2007", + "molaro_evolutionary_2018", + "soboleva_unique_2011" ] }, - "cH2B_(Animals)": { - "level": "variant_group", + "H2A.P_(Homo_sapiens)": { + "level": "variant", "description": { - "summary": "cH2B_(Animals) -- clustered H2B histones in animals (Metazoa), often called canonical, replication-dependent, replication-coupled or \"bulk\" H2B histones are a major class of H2B histones in animals with high sequence similarity across all animal species. Histone genes encodig these proteins have several particular features. 1) These genes lack introns and are found in multiple similar copies clustered along the genome togerther with other core histone genes (H3, H4, H2A, and optionally H1). The exact organisation may vary from tandemly repeated quintets of H3, H4, H2A, H2B, H1 genes transcribed from the same strand to non-tandem jumbled arrays of genes transcribed from divergent promoters [pontarotti_long-term_2009]. 
2) These genes are mainly expressed during S-phase of the cell cycle in a coordinated fashion (hence the name \"replication dendent\") and produce mRNAs that are not polyadenylated but rather end in a conserved stem-loop, which is further bound by the stem-loop binding protein (SLBP). mRNAs are rapidly degraded after the S-phase. 3) These genes are present in a specialized nuclear domain, the histone locus body (HLB), which concetrates factors for histone mRNA transcription and processing (in humans these include NPAT, U7 snRNP, FLASH) [marzluff_birth_2017].", - "taxonomy": "Animals (Metazoa)", + "summary": "H2A.P_(Homo_sapiens) - is a H2A.P variant histone encoded in humans by H2AP gene. See H2A.P variant description for more information. In human H2A.P gene H2ap was previously named HYPM (Huntingtin-interacting protein M) since in yeast two-hybrid experiments it was shown to interact with huntingtin, which contains an expanded polyglutamine tract in individuals with Huntington's disease [faber_huntingtin_1998].", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1557,25 +3028,25 @@ "structure": "null", "interactions": "null", "disease": "null", - "caveats": "1) Clustered histones may still exhibit some level of sequence variation between the multiple gene copies in certain species. Evidence exists that these differences may have functional implications (e.g. affect nucleosome stability). Some clustered genes have tissue-specific expression and play specific functional roles (e.g. cH2B.1 and cH2B.E in mice). 2) A subset of clustered histones, which are normally expressed as replication-dependent histones, are expressed as polyadenylated mRNAs in adult non-dividing tissues to replenish histone pool in differentiated tissues [lyons_subset_2016]. 
3) Certain clustered histones may act as functional histone variants with replication-independent polyA-tail-regulated expression being the major/only form (e.g. cH2B.E_(Mus_musculus), or H2A.J, which is closely related to cH2As). 4) In C. elegans an alternative mechanism of mRNA 3'-end processing evolved resulting in loss of HLB and histone clusters [marzluff_birth_2017, pontarotti_long-term_2009]. " + "caveats": "null" }, - "taxonomic_span": "Metazoa", - "taxonomic_span_id": "33208", + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", "alternate_names": [], "publications": [ - "pontarotti_long-term_2009", - "marzluff_birth_2017" + "9700202", + "faber_huntingtin_1998" ] }, - "cH2B_(Vertebrata)": { - "level": "variant_group", + "H2A.P_(Mus_musculus)": { + "level": "variant", "description": { - "summary": "cH2B_(Vertebrata) -- clustered H2B histones in vertebrates, often called canonical, replication-dependent, replication-coupled or \"bulk\" H2B histones. This is a subclass of cH2B_(Animals) (see it for a detailed description).", - "taxonomy": "Vertebrates (Vertebrata)", + "summary": "H2A.P_(Mus_musculus) - is a H2A.P variant histone encoded in mouse by H2ap gene. See H2A.P variant description for more information. 
Caveats: H2A.P in mice was previously named H2AL3 [govin_pericentric_2007] and H2A.Lap4 [soboleva_unique_2011].", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1585,20 +3056,23 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Vertebrata", - "taxonomic_span_id": "7742", + "taxonomic_span": "Mus musculus", + "taxonomic_span_id": "10090", "alternate_names": [], - "publications": [] + "publications": [ + "govin_pericentric_2007", + "soboleva_unique_2011" + ] }, - "cH2B_(Mammalia)": { - "level": "variant_group", + "H2A.Q": { + "level": "variant", "description": { - "summary": "cH2B_(Mammalia) -- clustered H2B histones in mammals, often called canonical, replication-dependent, replication-coupled or \"bulk\" H2B histones. This is a subclass of cH2B_(Vertebrata) and cH2B_(Animals) (see it for a detailed description).", - "taxonomy": "Mammals (Mammalia)", + "summary": "H2A.Q - is a short H2A variant present in many eutherian mammalian genomes at a distinct syntenic location. It is not well studied and has only been identified via bioinformatics approaches [molaro_evolutionary_2018]. Human and mouse do not have functional H2A.Q genes; there is a pseudogene in human, named H2AQ1P, and Molaro et al. also list coordinates for the mouse pseudogene (mm10, chrX, 59012618-59012929). No expression of H2A.Q has been found in primates either, and evolutionary analysis cannot confirm the presence of purifying selection for the respective genes. Like other intact short H2A genes, dog and pig H2A.Q genes are transcribed in testes but are undetectable in other tissues examined, including ovary [molaro_evolutionary_2018]. 
While tails of H2A.B and H2A.L are similar, they differ significantly from H2A.P and H2A.Q , suggesting that short histone H2A variants do not share the same function given the importance of the N-terminal tails in regulating nucleosome function [jiang_short_2020]. H2A.Q histone variants have variable N-terminus, truncated histone fold domain of variable length and altered acidic patch [molaro_evolutionary_2018].", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1608,19 +3082,23 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Mammalia", - "taxonomic_span_id": "40674", + "taxonomic_span": "Eutheria", + "taxonomic_span_id": "9347", "alternate_names": [], - "publications": [] + "publications": [ + "jiang_short_2020", + "molaro_evolutionary_2018" + ] }, - "cH2B_(Homo_sapiens)": { + "H2A.R": { "level": "variant_group", "description": { - "summary": "cH2B_(Homo_sapiens) -- clustered H2B histones in human, often called canonical, replication-dependent, replication-coupled or \"bulk\" H2B histones. For a general description see cH2B_(Animals) class. Replication-dependent histones in humans are found in four loci: a large cluster on chromosome 6 (more than 60 genes), two clusters on chromosome 1 (10-12 genes and 4 genes) and a single H4 gene on chromosome 12. Humans have 19 H2B genes that code for replication-dependent H2B histones. The cluster on chromosome 6 encodes 15 H2B genes (H2BC1, H2BC3-H2BC15, H2BC17) and several pseudogenes. The first cluster on chromosome 1 encodes 2 genes (H2BC18, H2BC21) and two pseudogenes (H2BC19P, H2BC20P), and the second cluster on chromosome 1 endodes one gene (H2BC26) and one pseudogene (H2BC27P). 
One additional gene H2BC12L is represented by a human-specific duplication of the H2BC12 gene from the chromosome 6 onto chromosome 21, the gene appears to be expressed, its protein sequence is expected to have two nonsynonymous substitutions with respect to H2BC12 gene. 19 cH2B genes in human enconde 15 protein variants. H2BC1 gene (formely, called HIST1H2BA, TH2B) is the most divergent gene of the family, together with H2AC1 they share a common promoter and maifest tissue-specific expression (at least in testis and oocytes) [huynh_two_2016].", + "summary": "H2A.R - is a histone variant found currently in monotremes and marsupials, it is an intermediate between the eutherian short histone H2A variants and canonical H2A. Evolutionary analysis suggests that ancestor histone H2A variant branched out to H2A.R (still possessing a C-terminus) in monotremes and marsupials, and to the four classes of the short histone H2A variants in eutherian mammals. H2A.R histone variants have variable N-terminus, altered charge of the histone fold domain, divergent L1-loop, altered acidic patch and extended C-terminal tail. Platypus and opossum H2A.R variants are expressed in the testis but not in other tissues we examined, including opossum ovary. Molaro et al. concluded that expression analysis allows to infer that testis-specific expression preceded the divergence of H2A.R and eutherian short histone H2A variants and is a common feature of all these genes. 
It is currently unclear whether the common ancestor of H2A.R and the short H2As was autosomal or sex chromosome-linked [molaro_evolutionary_2018].", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1628,20 +3106,51 @@ "structure": "null", "interactions": "null", "disease": "null", - "caveats": "1) A subset of clustered histones, which are normally expressed as replication-dependent histones, are expressed as polyadenylated mRNAs in adult non-dividing tissues to replenish histone pool in differentiated tissues [lyons_subset_2016]. " + "caveats": "null" + }, + "taxonomic_span": "Mammalia", + "taxonomic_span_id": "40674", + "alternate_names": [], + "publications": [ + "molaro_evolutionary_2018" + ] + }, + "H2A.W": { + "level": "variant_group", + "description": { + "summary": "H2A.W is a plant specific variant found in angiosperms (flowering plants) having a potentially DNA minor-groove-binding SPKK (sometime reffered to as KSPKKA) motif within its C-terminal tail, it is enriched in heterochromatin and implicated in gene silencing and DNA damage response.", + "taxonomy": "H2A.W variant is found exclusively in angiosperms [alvarez-venegas_canonical_2019].", + "genes": "Arabidopsis has three H2A.W genes (HTA6, HTA7, and HTA12) endoding three isoforms, rice genome has four genes (HTA701, HTA706, HTA707, and HTA710) encoding three isoforms. Isoforms endoded by different genes may have different number of SPKK motifs. A single copy of the SPKK motif seems to be true for all eudicots, whereas the monocots have been shown to possess 2 or even 3 copies of the same motif [alvarez-venegas_canonical_2019,kawashima_diversification_2015].", + "evolution": "H2A.W is a plant-lineage-specific variant that may have arisen early in the evolution of spermatophytes or seed plants. 
H2A.W lacks homologs in unicellular green algae, liverworts, mosses, and lycophytes but has distinctive homologs in early spermatophytes from the genera Ginkgo, Cycas, and Gnetum [alvarez-venegas_canonical_2019,kawashima_diversification_2015]. Instead of H2A.W homologs, Kawashima et al. identified a novel group of related H2A variants, they named H2A.M, in the genomes of liverworts, mosses, and lycophytes [kawashima_diversification_2015]. Whether H2A.M and H2A.W emerged from the same ancestor or H2A.M in early basal land plants evolved gradually to become H2A.W in seed plants remains undetermined [alvarez-venegas_canonical_2019,kawashima_diversification_2015].", + "expression": "In Arabidopsis HTA6 and HTA7 were found to have S-phase specific expression during the cell cycle, while HTA12 did not manifest any specific cell-cycle expression peak [alvarez-venegas_canonical_2019,menges_genome-wide_2003].", + "knock-out": "In Arabidopsis single mutants of H2A.W genes do not display any phenotype; double mutants, HTA6 HTA7 and HTA6 HTA12, and triple mutants result in growth defects that were even more severe in the triple mutant. This suggests that the three H2A.W paralogs in Arabidopsis are functionally redundant [alvarez-venegas_canonical_2019,yelagandula_histone_2014]. HTA7 knock-out in Arabidopsis results in sensitivity to genotoxic agents [lorkovic_compartmentalization_2017].", + "function": "H2A.W participates in constitutive heterochromatin formation, particularly pericentric heterochromatin [yelagandula_histone_2014]. H2A.W.7 (HTA7 gene) in Arabidopsis was shown to be involved in DNA damage response. It contains an SQ motif within C-terminal tail, which is phosphorylated by ATM kinase upon DNA damage [lorkovic_compartmentalization_2017].", + "sequence": "A characteristic feature of H2A.W sequences is the presence of one or multiple SPKK motifs within its long C-terminal tail. 
The SPKK motif was reported to preferentially bind AT-rich DNA, which is a feature of pericentric heterochromatin occupied by H2A.W in Arabidopsis [churchill_spkk_1989]. H2A.W variants also have significant sequence alerations within L1-loop and docking domain, which influence nucleosome stability [osakabe_histone_2018]. L1-loop of flowering plants contains (RYA/SK/Q) motif [kawashima_diversification_2015].", + "localization": "Genome-wide analysis showed that H2A.W variants localize with heterochromatin, transposable elements, H3K9me2-rich regions [yelagandula_histone_2014].", + "deposition": "Specific deposition mechanism are not known. Certain H2A.W are desposited during S-phase in a replication-dependent manner, while others manifest replication-independent deposition [alvarez-venegas_canonical_2019].", + "structure": "The extended C-terminal tail of H2A.W interacts with linker DNA and protects DNA from the cleavage by MNase [osakabe_histone_2018]. H2A.W may facilitate heterochromatin formation by promoting long-range interactions between nucleosomes, an activity that requires the long C-terminal tail domain containing a SPKK motif [alvarez-venegas_canonical_2019,yelagandula_histone_2014]. Replacement of H2A.W L1-loop with the corresponding sequence from H2A does not affect nucleosome stability [osakabe_histone_2018].", + "interactions": "It was hypothesized that C-terminal tail of H2A.W may impact H1 binding [osakabe_histone_2018].", + "disease": "null", + "caveats": "null" }, - "publications": [ - "huynh_two_2016" - ] + "taxonomic_span": "Magnoliopsida", + "taxonomic_span_id": "3398", + "alternate_names": [ + { + "name": "H2A with SPKK motifs" + } + ], + "publications": [] }, - "cH2B.1_(Homo_sapiens)": { - "level": "variant", + "H2A.X": { + "level": "variant_group", "description": { - "summary": "cH2B.1_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC1 gene (formerly, HIST1H2BA, TH2B). 
This is the most divergent gene of the family (around 85% identity with other cH2Bs) [zalensky_human_2002]. Its length is also one amino acid longer than for the rest of H2Bs (126 amio acid residues after initiator methionine cleavage). Together with H2AC1 they share a common promoter and manifest tissue-specific expression (at least in testis and oocytes) (see human protein atlas). H2AC1 and H2BC1 are thought to be maternal effect factors and their expression was shown to enhance OSKM-induced cell reprogramming in human cells [huynh_two_2016]. See also description of cH2B.1_(Mus_musculus) -- a related histone variant encoded by H2bc1 gene which has been characterized through a number of in vivo and in vitro studies. Phylogenetic analysis of cH2B.1 in mammals by Raman et al. suggests that when considered together with its N-terminal tail histones form a distinct phylogenetic clade with high bootstrap support [raman_novel_2022].", + "summary": "H2A.X is an H2A histone variant present in almost all Eukaryotes most notably involved in DNA damage response, marking the double strand DNA breaks with its phosphorylated form \u0263-H2A.X. It is also more broadly implicated in chromatin remodeling, found at collapsed replication forks and heterochromatin. It is a non-monophyletic (polyphyletic) variant of H2A and has the charactristic SQE/D\u03a6 motif at C-terminus (SQAY in Drosophila), where \u03a6-represents a hydrophobic residue (usually Tyr in mammals), and S is phosphorylation site. In multicellular eukaryotes H2A.X is usually closely related to cH2As in the same group of multicellular organisms [millar_organizing_2013, talbert_histone_2021]. It seems likely that H2A.X was ancestral to cH2As due to its conserved role in DNA damage response [talbert_histone_2010]. Caveats: Nematodes are the only known species that lack H2A.X. Many fungi lack canonical H2A its role is fullfiled by H2A.X. 
In Drosophila melanogaster H2A.X function is fullfiled by H2A.Z histone.", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1651,33 +3160,32 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "Eukaryotes", + "taxonomic_span_id": "2759", "alternate_names": [ { - "name": "TH2B" - }, - { - "name": "TS H2B.1" - }, - { - "name": "hTSH2B" + "name": "member X" } ], "publications": [ - "zalensky_human_2002", - "huynh_two_2016", - "raman_novel_2022" + " talbert_histone_2021", + "18095327", + "22650316", + "23301656", + "25731851", + "millar_organizing_2013", + "talbert_histone_2010" ] }, - "cH2B.2_(Homo_sapiens)": { + "H2A.X_(Animals)": { "level": "variant", "description": { - "summary": "cH2B.2_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC3 gene.", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1687,19 +3195,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], "publications": [] }, - "cH2B.3_(Homo_sapiens)": { + "H2A.X_(Fungi)": { "level": "variant", "description": { - "summary": "cH2B.3_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC4, H2BC6, H2BC7, H2BC8, H2BC10 genes.", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1709,19 +3218,20 @@ "disease": "null", 
"caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], "publications": [] }, - "cH2B.4_(Homo_sapiens)": { + "H2A.X_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "cH2B.4_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC5 gene.", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1731,19 +3241,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], "publications": [] }, - "cH2B.5_(Homo_sapiens)": { + "H2A.X_(Mammalia)": { "level": "variant", "description": { - "summary": "cH2B.5_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC9 gene.", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1753,19 +3264,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], "publications": [] }, - "cH2B.6_(Homo_sapiens)": { + "H2A.X_(Mus_musculus)": { "level": "variant", "description": { - "summary": "cH2B.6_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC11 gene.", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1775,19 
+3287,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], "publications": [] }, - "cH2B.7_(Homo_sapiens)": { + "H2A.X_(Plants)": { "level": "variant", "description": { - "summary": "cH2B.7_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC12 gene.", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1797,19 +3310,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], "publications": [] }, - "cH2B.8_(Homo_sapiens)": { + "H2A.X_(Protists)": { "level": "variant", "description": { - "summary": "cH2B.8_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC13 gene.", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1819,19 +3333,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], "publications": [] }, - "cH2B.9_(Homo_sapiens)": { + "H2A.X_(Vertebrata)": { "level": "variant", "description": { - "summary": "cH2B.9_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC14 gene.", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", 
"localization": "null", @@ -1841,19 +3356,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], "publications": [] }, - "cH2B.10_(Homo_sapiens)": { - "level": "variant", + "H2A.Z": { + "level": "variant_group", "description": { - "summary": "cH2B.10_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC15 gene.", + "summary": "H2A.Z is a replication-independent H2A histone variant strongly conserved in almost all Eukaryotes (exceptions may include some metamonads (e.g. Giardia, Trichomonas), Amebae and parasitic fungi [dalmasso_canonical_2011]). This histone variant is essential from Tetrahymena to mammals (although its knock out in yeast is not lethal) and amounts to around 5-10% of H2A histones [dalmasso_canonical_2011]. H2A.Z containing nucleosomes often localize near transcription start sites (+1 nucleosomes) and enhancer regions, they are thought to be involved in Pol II recruitment, transcription regulation, DNA repair, suppression of antisense RNA, heterochromatin regulation. [giaimo_histone_2019]. H2A.Z nucleosomes have a larger acidic patch, an amino acid insertion in \u03b11-helix and one deletion in the docking domain compared to the canonical H2A. The L1-loop region exhibits four amino acids difference between H2A.Z and canonical H2A and is likely involved in conferring stability and functional specificity of variant nucleosomes via L1-L1 interactions [shaytan_nucleosome_2015]. 
C-terminal region of the yeast H2A.Z protein interacts with RNA polymerase II (RNAPII), promoting its recruitment at promoters [adam_h2az_2001].", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1863,19 +3379,67 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", - "alternate_names": [], - "publications": [] + "taxonomic_span": "Eukaryotes", + "taxonomic_span_id": "2759", + "alternate_names": [ + { + "name": "Htz1p", + "taxonomy": "saccharomyces" + }, + { + "name": "hv1", + "taxonomy": "tetrahymena" + }, + { + "name": "H2A.V", + "taxonomy": "drosophila" + }, + { + "name": "H2Av", + "taxonomy": "drosophila" + }, + { + "name": "H2AvD", + "taxonomy": "drosophila" + }, + { + "name": "D2", + "taxonomy": "drosophila" + }, + { + "name": "member Z" + } + ], + "publications": [ + "11101893", + "18275809", + "19193230", + "20003410", + "20197778", + "22467210", + "22650316", + "23301656", + "24311584", + "24768041", + "24969791", + "25731851", + "adam_h2az_2001", + "colino-sanguino_h2az-nuclesome_2021", + "dalmasso_canonical_2011", + "giaimo_histone_2019", + "shaytan_nucleosome_2015", + "talbert_histone_2021" + ] }, - "cH2B.11_(Homo_sapiens)": { + "H2A.Z.1_(Chordata)": { "level": "variant", "description": { - "summary": "cH2B.11_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC17 gene.", + "summary": "H2A.Z.1_(Chordata) product of one of two H2A.Z genes conserved in chordates, homologous to human H2AZ1 gene [giaimo_histone_2019]. Products of H2AZ1 and H2AZ2 genes differ by only three amino acids, however they have acquired some degree of functional independence.
For example, H2A.Z.1 has been shown to better interact with bromodomain-containing protein 2 (BRD2) [draker_combination_2012], H2A.Z.2 preferentially associates with H3 trimethylated at lysine 4 (H3K4me3) [dryhurst_characterization_2009].", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1885,19 +3449,26 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "Chordata", + "taxonomic_span_id": "7711", "alternate_names": [], - "publications": [] + "publications": [ + "colino-sanguino_h2az-nuclesome_2021", + "draker_combination_2012", + "dryhurst_characterization_2009", + "giaimo_histone_2019", + "talbert_histone_2021" + ] }, - "cH2B.12_(Homo_sapiens)": { + "H2A.Z.1_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "cH2B.12_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC18 gene.", + "summary": "H2A.Z.1_(Homo_sapiens) H2A.Z variant encoded in humans by H2A.Z.1 gene. 
Differs by only 3 amino acids from the product of H2A.Z.2 gene.", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1907,19 +3478,24 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "Eukaryotes", + "taxonomic_span_id": "2759", "alternate_names": [], - "publications": [] + "publications": [ + "colino-sanguino_h2az-nuclesome_2021", + "giaimo_histone_2019", + "talbert_histone_2021" + ] }, - "cH2B.13_(Homo_sapiens)": { + "H2A.Z.1_(Primates)": { "level": "variant", "description": { - "summary": "cH2B.13_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC21 gene.", + "summary": "H2A.Z.1_(Primates) H2A.Z.1 variant in primates, see H2A.Z.1_(Chordata) variant description.", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1929,19 +3505,24 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "Primates", + "taxonomic_span_id": "9443", "alternate_names": [], - "publications": [] + "publications": [ + "colino-sanguino_h2az-nuclesome_2021", + "giaimo_histone_2019", + "talbert_histone_2021" + ] }, - "cH2B.14_(Homo_sapiens)": { + "H2A.Z.2.s1_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "cH2B.14_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC26 gene.", + "summary": "H2A.Z.2.s1_(Homo_sapiens) this is the main full length splice isoform of H2A.Z.2 in humans as compared to an alternatively spliced H2A.Z.2.s2 isoform which has an alternative shorter C-terminus [giaimo_histone_2019].", + "taxonomy": "null",
"genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1954,16 +3535,19 @@ "taxonomic_span": "Homo sapiens", "taxonomic_span_id": "9606", "alternate_names": [], - "publications": [] + "publications": [ + "giaimo_histone_2019" + ] }, - "cH2B.15_(Homo_sapiens)": { + "H2A.Z.2.s1_(Primates)": { "level": "variant", "description": { - "summary": "cH2B.15_(Homo_sapiens) -- is an isoform (variant) of clustered (canonical) H2B histones in human endoded by H2BC12L gene. H2BC12L is represented by a human-specific duplication of the H2BC12 gene from the chromosome 6 onto chromosome 21, the gene appears to be expressed, its protein sequence is expected to have two nonsynonymous substitutions with respect to H2BC12 gene.", + "summary": "H2A.Z.2.s1_(Primates) this is the main full length splice isoform of H2A.Z.2 in primates as compared to an alternatively spliced H2A.Z.2.s2 isoform which has an alternative shorter C-terminus [giaimo_histone_2019].", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -1973,78 +3557,47 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "Primates", + "taxonomic_span_id": "9443", "alternate_names": [], - "publications": [] - }, - "cH2B_(Mus_musculus)": { - "level": "variant_group", - "description": { - "summary": "cH2B_(Mus_musculus) -- clustered H2B histones in mouse, often called canonical, replication-dependent, replication-coupled or \"bulk\" H2B histones. repliation-dependent histones in mouse similar to human are found in several clusters. The largest cluster is found on chromosome 13 (more than 50 genes) and smaller clusters on chromosomes 3 and 11 [marzluff_human_2002].
There are 18 replication-dependent H2B genes currently annotated in mouse genome: 15 in cluster on chromosome 13, 2 in cluster on chromosome 3 and 1 on chromosome 11.", - "genes": "null", - "evolution": "null", - "expression": "null", - "knock-out:": "null", - "function": "null", - "sequence": "null", - "localization": "null", - "deposition": "null", - "structure": "null", - "interactions": "null", - "disease": "null", - "caveats": "null" - }, - "taxonomic_span": "Mus musculus", - "taxonomic_span_id": "10090", "publications": [ - "marzluff_human_2002" + "giaimo_histone_2019" ] }, - "cH2B.1_(Mus_musculus)": { + "H2A.Z.2.s2_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "cH2B.1_(Mus_musculus) -- is an isoform (variant) of clustered (canonical) H2B histones in mouse endoded by H2bc1 gene (formerly, Hist1h2ba, Th2b). This is the most divergent gene of the family, its protein product has differences in INSERT HERE. Together with H2ac1 gene they share a common promoter and manifest tissue-specific expression (at least in testis, oocytes and zygotes) [padavattan_structural_2015]. Disruption of Th2a and Th2b genes causes defects in spermatogenesis [shinagawa_disruption_2015]. H2ac1 and H2bc1 contribute to activation of the paternal genome after fertilization [shinagawa_histone_2014]. These variant facilitate OSKM-induced cell reprogramming [shinagawa_histone_2014]. X-ray structure of nucleosome harboring this variant have fewer histone-DNA contacts and perturbed L1-L1-loop interactions. Mutational in vivo analysis suggest histone tails and L1 loop of cH2A.1 are important for reprogramming [padavattan_structural_2015]. Differential scanning calorimetry analysis indicated that the H2ac1/H2bc1 complex was more stable than other combinations of canonical histones [shinagawa_histone_2014]. 
This variant is related to cH2B.1_(Homo_sapiens) encoded by H2B1C gene, is located in the same position at the largest histone gene cluster, however, their sequence differs at INSERT HERE positions. Structural and in vitro studies suggest that cH2B.1-containing nucleosomes are less stable than RC H2B, which may allow H2B.1 to facilitate histone-protamine exchange during spermatogenesis. More recently, H2B.1 has also been detected in mouse oocytes, where its function is not yet understood [raman_novel_2022]. Note: Since this variant manifests similar features in mice and humans (tissue-specific expression, synteny, divergent sequence with respect to other canonical variants in each species) likely similar variants exist in all supraprimates or in higher taxa. Once and if sufficient evidence accumulates such variants may be grouped into a separate class.", - "taxonomy": "Mus musculus (House mouse)", + "summary": "H2A.Z.2.s2_(Homo_sapiens) this is an alternatively spliced isoform of H2A.Z.2 in humans which has an alternative shorter C-terminus with respect to H2A.Z.2.s1 isoform. This isoform is expressed in a wide range of tissues, including brain tissues. Nucleosomes containing the H2A.Z.2.s2 isoform are less stable than nucleosomes with the main isoform. [giaimo_histone_2019].", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", "deposition": "null", "structure": "null", - "interactions": "Govin et al.
investigated the stability of nucleosomes incorporating cH2B.1/H2A.L.2 histone dimer (H2A.L.2 encoded by H2al2a gene in mouse was used) and concluded that they were less stable than nucleosomes containing somatic histones [govin_pericentric_2007].", + "interactions": "null", "disease": "null", "caveats": "null" }, - "taxonomic_span": "Mus musculus", - "taxonomic_span_id": "10090", - "alternate_names": [ - { - "name": "Th2b" - }, - { - "name": "TS H2B.1" - } - ], + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], "publications": [ - "padavattan_structural_2015", - "shinagawa_disruption_2015", - "shinagawa_histone_2014", - "raman_novel_2022" + "giaimo_histone_2019" ] }, - "cH2B.E_(Mus_musculus)": { + "H2A.Z.2.s2_(Primates)": { "level": "variant", "description": { - "summary": "cH2B.E_(Mus_musculus) -- is an isoform (variant) of clustered (canonical) H2B histones in mouse endoded by H2bc21 gene (histone gene cluster on chromosome 3). It differs by four of five amino acids from other cH2Bs in mouse. It is expressed via a polyA-tail containing mRNA, typical of replication-independent variants in the main olfactory epithelium and the vomeronasal organ [santoro_activity-dependent_2012]. Santoro and Dulac showed that its expression is reduced by sensory activity and that it promotes neuronal cell death, such that inactive olfactory neurons display higher levels of the variant and shorter life spans. [santoro_activity-dependent_2012]", - "taxonomy": "Mus musculus (House mouse)", + "summary": "H2A.Z.2.s2_(Primates) this is an alternatively spliced isoform of H2A.Z.2 in primates which has an alternative shorter C-terminus with respect to H2A.Z.2.s1 isoform. This isoform is expressed in a wide range of tissues, including brain tissues. Nucleosomes containing the H2A.Z.2.s2 isoform are less stable than nucleosomes with the main isoform.
[giaimo_histone_2019].", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -2054,26 +3607,22 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Mus musculus", - "taxonomic_span_id": "10090", - "alternate_names": [ - { - "name": "H2B.21" - } - ], + "taxonomic_span": "Primates", + "taxonomic_span_id": "9443", + "alternate_names": [], "publications": [ - "santoro_activity-dependent_2012" + "giaimo_histone_2019" ] }, - "cH2B_(Plants)": { - "level": "variant_group", + "H2A.Z.2_(Chordata)": { + "level": "variant", "description": { - "summary": "cH2B_(Plants) -- canonical H2B histones of green plants (Viridiplantae), which include green algae and land plants. Currently, this is a loosely defined group of replication-dependent H2B histones in plants together with similar sequences that might have further diversified towards replication-independent tissue-specific expression but have not yet been extensively studied. An example of the latter would be the HTB3 gene of Arabidopsis which has the hallmarks of a replacement histone variant enriched in mature cells [jiang_evolution_2020]. Organisation of canonical histones in green plants is variable. In land plants unlike clustered/canonical histones of animals (see cH2B_(Metazoa)) replication dependent histone mRNAs are polyadenilated and genes are interspersed throught the genome. In chlorophyte green algae, such as Chlamydomonas, genes are grouped in clusteres and mRNAs end in 3'-stem loop similar to those of histone genes in animals [marzluff_metabolism_2008, alvarez-venegas_canonical_2019]. Plant H2Bs vary substantially in the length and sequence of their N-terminal tails [jiang_evolution_2020,bergmuller_characterization_2007]. A study of evolution and functional divergence of H2B histones in plants by Jiang et al. 
concluded that amongst flowering plants, eudicots had experienced the highest degree of divergence among H2B genes [jiang_evolution_2020]. This divergence appears to have been driven by preferential expression during gametogenesis, including three genes in Arabidopsis (HTB7/8/10 genes) and at least one in tomato. While HTB8 gene in Arabidopsis belongs to a phylogenetically distinct H2B.S variant [jiang_evolution_2020], HTB7 and HTB10 are much more similar in sequence to other H2Bs for now are included as cH2B in our classification [alvarez-venegas_canonical_2019].", - "taxonomy": "Viridiplantae (Plants)", + "summary": "H2A.Z.2_(Chordata) product of one of two H2A.Z genes conserved in chordates, homologous to human H2A.Z.2 gene [giaimo_histone_2019]. Products of H2A.Z.1 and H2A.Z.2 genes differ by only three amino acids, however they have acquired some degree of functional independence. For example, H2A.Z.1 has been shown to better interact with bromodomain-containing protein 2 (BRD2) [draker_combination_2012], H2A.Z.2 preferentially associates with H3 trimethylated at lysine 4 (H3K4me3) [dryhurst_characterization_2009].", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -2083,26 +3632,26 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Viridiplantae", - "taxonomic_span_id": "33090", + "taxonomic_span": "Chordata", + "taxonomic_span_id": "7711", "alternate_names": [], "publications": [ - "jiang_evolution_2020", - "marzluff_metabolism_2008", - " alvarez-venegas_canonical_2019", - "bergmuller_characterization_2007", - "alvarez-venegas_canonical_2019" + "colino-sanguino_h2az-nuclesome_2021", + "draker_combination_2012", + "dryhurst_characterization_2009", + "giaimo_histone_2019", + "talbert_histone_2021" ] }, - "cH2B_(Embryophyta)": { - "level": "variant_group", + "H2A.Z.2_(Primates)": { + "level": "variant",
"description": { - "summary": "cH2B_(Embryophyta) -- canonical H2B histones of land plants. In land plants unlike clustered/canonical histones of animals (see cH2A_(Metazoa)) replication dependent histone mRNAs are polyadenilated and genes are interspersed throught the genome [marzluff_metabolism_2008, alvarez-venegas_canonical_2019]. See description of cH2B_(Plants) variant Jiang et al. paper for further information about H2B histones in plant [jiang_evolution_2020].", - "taxonomy": "Embryophyta", + "summary": "H2A.Z.2_(Primates) H2A.Z.2 variant in primates, see H2A.Z.2_(Chordata) variant description.", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -2112,24 +3661,24 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Embryophyta", - "taxonomic_span_id": "3193", + "taxonomic_span": "Primates", + "taxonomic_span_id": "9443", "alternate_names": [], "publications": [ - "marzluff_metabolism_2008", - " alvarez-venegas_canonical_2019", - "jiang_evolution_2020" + "colino-sanguino_h2az-nuclesome_2021", + "giaimo_histone_2019", + "talbert_histone_2021" ] }, - "cH2B_(Chlorophyta)": { - "level": "variant_group", + "H2B": { + "level": "type", "description": { - "summary": "cH2B_(Chlorophyta) -- canonical H2B histones of green algae and similar replication-independent histones. In chlorophyte green algae, such as Chlamydomonas, genes are grouped in clusteres and mRNAs end in 3'-stem loop similar to those of histone genes in animals [marzluff_metabolism_2008, alvarez-venegas_canonical_2019]. See description of cH2B_(Plants) variant Jiang et al. paper for further information about H2B histones in plant [jiang_evolution_2020].", - "taxonomy": "Chlorophyta", + "summary": "H2B is one of the core histone types present in all Eukaryotes. H2B forms dimers with H2A via the \"hand shake\" motif. 
Two H2A-H2B dimers in turn associate with H3-H4 tetramer to form complete nucleosome core. It has been suggested that H2A and H2B have arisen from H3 and H4 during evolution [malik_phylogenomics_2003]. Structure of H2B consists of a histone fold with a long flexible N-terminal tail which protrudes between the DNA gyres. H2B interacts with H4 in the nucleosome core via a four helix bundle motif. Additional \u03b1C-helix of H2B decorates the surface of nucleosome. Unlike H3 and H2A histones, H2B histones have a relatively modest number of characterized histone variants. Although in plants, histone H2Bs have undergone significant sequence divergence and expansion in the number of encoding genes [jiang_evolution_2020].", + "taxonomy": "Present in all Eukaryotes.", "genes": "null", - "evolution": "null", + "evolution": "It has been suggested that H2A and H2B have arisen from H3 and H4 during evolution [malik_phylogenomics_2003]. The eukaryotic H3-H4 tetramer resembles the tetramer found in Archaea, and it has been suggested that H2A and H2B have arisen from H3 and H4 later on in histone evolution [henneman_structure_2018].
The histone H2B (HTB) family shows the least conservation of all core histones likely because it is less evolutionarily constrained than its counterparts [alvarez-venegas_canonical_2019].", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -2139,26 +3688,25 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Chlorophyta", - "taxonomic_span_id": "3041", + "taxonomic_span": "Eukaryota", + "taxonomic_span_id": "2759", "alternate_names": [], "publications": [ - "marzluff_metabolism_2008", - " alvarez-venegas_canonical_2019", - "jiang_evolution_2020" + "jiang_evolution_2020", + "malik_phylogenomics_2003" ] }, - "cH2B_(Fungi)": { + "H2B.K": { "level": "variant_group", "description": { - "summary": "cH2B_(Fungi) -- canonical replication-dependent H2B histones in fungi. In most filamentous fungi, genes for the core histones H3, H2A, and H2B, as well as the linker histone H1, are unique [nowrousian_5_2014]. ", - "taxonomy": "Fungi", - "genes": "null", - "evolution": "null", - "expression": "Recent evidence suggests that the specialized stem-loop forming 3-prime-end of replication-dependent histone mRNAs originated early in the evolution of eukaryotes but was completely lost in several lineages, including plants, fungi and most protozoa. Instead, these species synthesize histones from cell-cycle-regulated polyadenylated mRNAs, and regulation is primarily at the level of transcription [marzluff_metabolism_2008].", - "knock-out:": "null", + "summary": "H2B.K is a variant identified so far bioinformatically by Raman et al. as a phylogenetically distinct clade of H2B variants in bony vertebrates [raman_novel_2022]. Newly identified histones H2B.N and H2B.K are primarily expressed in ovaries and early embryos, where they may play key roles in female fertility and early development like the cleavage stage histones of sea urchins.
Certain changes that distinguish H2B.K from canonical H2B occur around the second DNA binding loop that could affect DNA binding or specificity. H2B.K\u2019s N-terminal tail differs dramatically from canonical H2B [raman_novel_2022]. N-terminal tail is missing key lysine residues that are posttranslationally modified in canonical H2B. Atypically for H2B proteins, H2B.K also has a variable-length polyglutamine tract in its N-terminal tail that could facilitate protein\u2013protein interactions. H2B.K is a newly identified histone variant, its biochemical properties remain uncharacterized [raman_novel_2022].", + "taxonomy": "Bony vertebrates [raman_novel_2022].", + "genes": "An unusual feature of both H2B.K and H2B.N is that they are encoded by intron-containing genes, whereas all other H2B variants and canonical H2B lack introns [raman_novel_2022].", + "evolution": "H2B.K may have a common ancestor with H2B.N. H2B.K is the only H2B variant for which Raman et al. could identify an ortholog in the shared syntenic location in chicken, a nonmammalian outgroup. They found H2B.K orthologs at least as far back as bony fishes in shared syntenic locations. H2B.K orthologs from vertebrates also group with the previously identified cleavage-stage dependent histones in sea urchin. Both H2B.K and H2B.N were pseudogenized in rodents [raman_novel_2022].", + "expression": "H2B.K is expressed in ovaries of opossum, dog, human, and chicken, whereas H2B.K is expressed in both testes and ovaries in pig. Ovarian expression of H2B.K likely predates the divergence of birds and mammals. Analyses of human oogenesis revealed robust expression of H2B.K and H2B.N in oocytes, with levels increasing across oogenesis. Neither H2B.K nor H2B.N were detected in granulosa cells, which are the somatic cells of the female germline, suggesting again that expression is restricted to the germline.
A poly(A) signal is detected in the 3-prime-UTR of most H2B.K genes [raman_novel_2022].", + "knock-out": "null", "function": "null", - "sequence": "null", + "sequence": "", "localization": "null", "deposition": "null", "structure": "null", @@ -2166,24 +3714,24 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Fungi", - "taxonomic_span_id": "4751", + "taxonomic_span": "Euteleostomi", + "taxonomic_span_id": "117571", "alternate_names": [], "publications": [ - "nowrousian_5_2014" + "raman_novel_2022" ] }, - "cH2B_(Protists)": { - "level": "variant_group", + "H2B.K_(Homo_sapiens)": { + "level": "variant", "description": { - "summary": "cH2B_(Protists) -- canonical replication-dependent H2B histones in various protists.", - "taxonomy": "Protists", - "genes": "null", + "summary": "H2B.K_(Homo_sapiens) is mainly oocyte specific H2B.K variant in human encoded by H2BK1 gene (formerly H2BE1). See H2B.K description for more information.", + "taxonomy": "Human", + "genes": "H2BK1 gene", "evolution": "null", - "expression": "Recent evidence suggests that the specialized stem-loop forming 3-prime-end of replication-dependent histone mRNAs originated early in the evolution of eukaryotes but was completely lost in several lineages, including plants, fungi and most protozoa.
Instead, these species synthesize histones from cell-cycle-regulated polyadenylated mRNAs, and regulation is primarily at the level of transcription [marzluff_metabolism_2008].", - "knock-out:": "null", + "expression": "null", + "knock-out": "null", "function": "null", - "sequence": "null", + "sequence": "", "localization": "null", "deposition": "null", "structure": "null", @@ -2191,20 +3739,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "", - "taxonomic_span_id": "", + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", "alternate_names": [], "publications": [] }, "H2B.L": { "level": "variant_group", "description": { - "summary": "H2B.L (also named subH2B) -- is an unusual H2B variant found outside of the nucleus in the in the subacrosomal space of spermatozoa. First characterized as a major component of the subacrosomal layer of the perinuclear theca (SAL-PT) in bulls sperm heads (named subH2Bv) [aul_major_2001]. SAL-PT resides within in the layer of condensed cytosol between acrosome and the nucleus of the spermatid [tran_involvement_2012]. N-terminal tail of subH2Bv contains a bipartite nuclear localization signal (bNLS) [tran_involvement_2012]. A study be Tran et al. suggested that this bNLS allows subH2Bv during spermiogenesis to target proacrosomic and acrosomic vesicles to the nuclear envelope by binding to the nucleocytoplasmic receptor KPNA [tran_involvement_2012]. In mouse Govin et al. have identified a homologous protein, which was named H2BL1, which was shown to accumalate in late spermiogenesis in condensing spermatids [govin_pericentric_2007]. Although when expressed ectopically fused with EGPFP the protein enters cell nucleus, it is has not been seen developmentally within the nucleus of the spermatid [tran_involvement_2012]. Thus currently there is no evidence that subH2B participates in nucleosome formation. 
The currently suggested name for this variant is H2B.L [raman_novel_2022].", + "summary": "H2B.L (also named subH2B) is an unusual H2B variant found outside of the nucleus in the subacrosomal space of spermatozoa. First characterized as a major component of the subacrosomal layer of the perinuclear theca (SAL-PT) in bull sperm heads (named subH2Bv) [aul_major_2001]. SAL-PT resides within the layer of condensed cytosol between acrosome and the nucleus of the spermatid [tran_involvement_2012]. N-terminal tail of subH2Bv contains a bipartite nuclear localization signal (bNLS) [tran_involvement_2012]. A study by Tran et al. suggested that this bNLS allows subH2Bv during spermiogenesis to target proacrosomic and acrosomic vesicles to the nuclear envelope by binding to the nucleocytoplasmic receptor KPNA [tran_involvement_2012]. In mouse Govin et al. have identified a homologous protein, which was named H2BL1, which was shown to accumulate in late spermiogenesis in condensing spermatids [govin_pericentric_2007]. Although when expressed ectopically fused with EGFP the protein enters cell nucleus, it has not been seen developmentally within the nucleus of the spermatid [tran_involvement_2012]. Thus currently there is no evidence that subH2B participates in nucleosome formation. The currently suggested name for this variant is H2B.L [raman_novel_2022].", "taxonomy": "Likely mammals, characterized mainly in bull and mouse. In Homininae the gene is pseudogenised (H2BL1P pseudogene in human). Gene is pseudogenised also in many primates [raman_novel_2022].", "genes": "H2bl1 in mouse.", "evolution": "Human genome appears to encode a H2B.L pseudogene, which is a single mutation away from encoding an intact ORF.
Frameshifting mutation (and subsequent early stop codon) found in humans is also present in chimpanzee, bonobo, and gorilla, suggesting that a true pseudogenization event occurred around 9 Ma in Homininae [raman_novel_2022].", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "In mouse is around 40% identical to canonical H2B histone. The most divergent part is its unique N-terminal tail, which contains a bipartite nuclear localization signal [tran_involvement_2012]. Protein length in mouse is 122 aa (without initiator methionine), compared to 125 aa for canonical H2B.", "localization": "null", @@ -2231,74 +3779,154 @@ "11892742", "22156475", "aul_major_2001", - "tran_involvement_2012", "govin_pericentric_2007", - "raman_novel_2022" + "raman_novel_2022", + "tran_involvement_2012" ] }, - "H2B.W": { + "H2B.N": { "level": "variant_group", "description": { - "summary": "H2B.W -- is a testis-specific histone variant involved in spermiogenesis. It was suggested to have telomere-associated functions and participate in the telomere-binding complex in the human sperm [churikov_novel_2004, gineitis_human_2000]. It has a long extended N-terminal tail, has about 45% amino acid sequence identity and 70% similarity with both the major somatic H2Bs [churikov_novel_2004]. First, characterized in human as H2BFWT gene (now called H2BW1 gene). In mouse a paralog of H2B.W variant was initially identified by Govin et al. and named H2BL2 [govin_pericentric_2007]. In human beings, unlike other mammals including the mouse, core histones (H2A, H2B, H3 and H4) are not displaced completely during spermiogenesis and account for approximately 15% of the basic chromosomal proteins within the mature sperm [lee_functional_2009]. At least human H2B.W can replace conventional histone H2B in the nucleosome, does not affect the overall structure and stability of the nucleosome [boulard_nh2_2006]. 
In contrast to conventional H2B, H2B.W was unable to recruit chromosome condensation factors and to participate in the assembly of mitotic chromosomes, this fact is attibuted to its highly divergent NH2 tail [boulard_nh2_2006].", - "taxonomy": "Mammals", - "genes": "Human has two H2B.W-encoding paralogs which are now named as H2BW1 and H2BW2 and two pseudogenes (H2BW3P and H2BW4P) all located on the X chromosome between RAB9B and SLC25A3, while mouse has only one H2B.W-encoding gene (H2bw2) found in a syntenic location. Other mammals have different numbers of H2BW paralogs (between 1 and 4) but these are all located at the same conserved location of the X chromosome [Ruth et al]. The H2BFWT gene contains two introns and is transcribed exclusively in testis, where the spliced polyadenylated mRNA was detected [churikov_novel_2004].", - "evolution": "null", - "expression": "null", - "knock-out:": "null", + "summary": "H2B.N is a variant identified so far bioinformatically by Raman et al. as a phylogenetically distinct clade of H2B variants in mammals [raman_novel_2022]. Newly identified histones H2B.N and H2B.K are primarily expressed in ovaries and early embryos, where they may play key roles in female fertility and early development like the cleavage stage histones of sea urchins. H2B.N shares less than 50% identity with canonical H2Bs in the histone fold domain. Although H2A-, H4-interacting residues, and residues in L2 are largely conserved between H2B.N orthologs, they are highly divergent from cH2Bs. H2B.N orthologs are significantly truncated in their C-terminus. Removing the alpha-C domain eliminates the important nucleosome acidic patch that mediates many other chromatin interactions. This suggests that the unusual H2B.N could endow nucleosomes with unique properties, or that H2B.N might have evolved nonnucleosomal functions, like H2B.L [raman_novel_2022].
H2B.N is a newly identified histone variant, its biochemical properties remain uncharacterized [raman_novel_2022].", + "taxonomy": "Mammals [raman_novel_2022].", + "genes": "An unusual feature of both H2B.K and H2B.N is that they are encoded by intron-containing genes, whereas all other H2B variants and canonical H2B lack introns. Like most mammals, H2B.K and H2B.N are present in single copy in all primates, whereas H2B.1 and H2B.W are present in multiple copies [raman_novel_2022].", + "evolution": "H2B.K may have a common ancestor with H2B.N. Analysis by Raman et al. found that H2B.L and H2B.N contain marsupial and platypus (but not chicken) sequences, and therefore arose in the last common ancestor of all mammals. Both H2B.K and H2B.N were pseudogenized in rodents [raman_novel_2022].", + "expression": "H2B.N was found to be expressed in ovaries of opossum, dog, and humans. Analyses of human oogenesis revealed robust expression of H2B.K and H2B.N in oocytes, with levels increasing across oogenesis. Neither H2B.K nor H2B.N were detected in granulosa cells, which are the somatic cells of the female germline, suggesting again that expression is restricted to the germline. A poly(A) signal is detected in the 3-prime-UTR of most H2B.N genes [raman_novel_2022].", + "knock-out": "null", "function": "null", "sequence": "", "localization": "null", "deposition": "null", "structure": "null", "interactions": "null", - "disease": "Single nucleotide polymorphisms (SNPs) in H2B.W genes may result in male infertility. See meta-analysis of several studies by Teimouri et al. [teimouri_association_2018].", + "disease": "null", "caveats": "null" }, "taxonomic_span": "Mammalia", "taxonomic_span_id": "40674", + "alternate_names": [], + "publications": [ + "raman_novel_2022" + ] + }, + "H2B.N_(Homo_sapiens)": { + "level": "variant", + "description": { + "summary": "H2B.N_(Homo_sapiens) is mainly oocyte specific H2B.N variant in human encoded by H2BN1 gene. 
See H2B.N description for more information.", + "taxonomy": "Human", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", + "alternate_names": [], + "publications": [] + }, + "H2B.O": { + "level": "variant_group", + "description": { + "summary": "H2B.O is a class of H2B sequences identified exclusively in the platypus genome that group together in phylogenetic analysis. H2B.O expression appears to be enriched in platypus\u2019 germline tissues (testes or ovaries) albeit at low levels [raman_novel_2022].", + "taxonomy": "Platypus [raman_novel_2022].", + "genes": "null", + "evolution": "null", + "expression": "H2B.O expression appears to be enriched in platypus\u2019 germline tissues (testes or ovaries) albeit at low levels [raman_novel_2022].", + "knock-out": "null", + "function": "null", + "sequence": "", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Ornithorhynchus anatinus", + "taxonomic_span_id": "9258", + "alternate_names": [], + "publications": [ + "raman_novel_2022" + ] + }, + "H2B.S": { + "level": "variant_group", + "description": { + "summary": "H2B.S is a new class of highly divergent H2B variants identified by Jiang et al. 
that specifically accumulate during chromatin compaction of dry seed embryos in multiple species of flowering plants [jiang_evolution_2020].", + "taxonomy": "Flowering plants (angiosperms) [jiang_evolution_2020]", + "genes": "HTB8 gene in Arabidopsis, Solyc06g074750.1 in tomato, LOC_Os09g39730 in rice.", + "evolution": "Despite forming a distinct angiosperm-specific clade, H2B.S variants show a high degree of variation, even amongst closely related genera. Other highly divergent sequences from Streptophyte algae and gymnosperms form a grade basal to H2B.S variants, suggesting a deeper evolutionary origin, which cannot be currently analyzed due to the lack of conserved substitutions and similar sequences in bryophytes, lycophytes and ferns [jiang_evolution_2020].", + "expression": "Arabidopsis HTB8 is specifically expressed in sperm and mature embryos. Unlike Arabidopsis HTB8, expression in anthers, pollen or sperm cells was evident in neither rice nor maize [jiang_evolution_2020].", + "knock-out": "null", + "function": "For Arabidopsis an adaptive function in cell types that become desiccated, quiescent or show higher degrees of chromatin compaction has been suggested [jiang_evolution_2020].", + "sequence": "The angiosperm-specific clade of Arabidopsis HTB8 orthologs was characterized by conserved substitutions in the histone core, slightly extended C-terminal tails and greatly expanded N-terminal tails with a KVVXETV motif [jiang_evolution_2020].", + "localization": "null", + "deposition": "null", + "structure": "Two HTB8 residues, Arg152 and Met179, were highly conserved among HTB8 orthologs and were positioned in such a way that they might contribute to stronger interactions with DNA and histone H2A, respectively. 
These and other observations suggest that sequence divergence in HTB8 impact intra-nucleosomal interactions to potentially alter nucleosome structure and/or stability [jiang_evolution_2020].", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Magnoliopsida", + "taxonomic_span_id": "3398", + "alternate_names": [], + "publications": [ + "jiang_evolution_2020" + ] + }, + "H2B.V": { + "level": "variant_group", + "description": { + "summary": "H2B.V is a histone variant characterized so far in Trypanosoma brucei. It shares ~38% sequence identity with major H2B. H2B.V is essential for viability. H2A.Z and H2B.V colocalize throughout the cell cycle and exhibit nearly identical genomic distribution. Data strongly suggest that H2A.Z and H2B.V function together within a single nucleosome [lowell_histone_2005]. H2BV possibly regulates H3 K4 and K76 trimethylation in Trypanosoma brucei [mandava_trypanosome_2008].", + "taxonomy": "Trypanosoma", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Trypanosoma", + "taxonomic_span_id": "5690", "alternate_names": [ { - "name": "H2BFWT" - }, - { - "name": "member W" - }, - { - "name": "type W-T" - }, - { - "name": "H2BL2" - }, - { - "name": "spH2B" + "name": "H2BV" } ], "publications": [ - "11892742", - "22156475", - "churikov_novel_2004", - " gineitis_human_2000", - "govin_pericentric_2007", - "lee_functional_2009", - "boulard_nh2_2006" + "lowell_histone_2005" ] }, - "H2B.W_(Homo_sapiens)": { + "H2B.W": { "level": "variant_group", "description": { - "summary": "H2B.W_(Homo_sapiens) -- is a testis-specific histone variant involved in spermiogenesis. Human has two H2B.W-encoding paralogs which are now named as H2BW1 and H2BW2 genes. 
See H2B.W description for more information.", + "summary": "H2B.W is a testis-specific histone variant involved in spermiogenesis. It was suggested to have telomere-associated functions and participate in the telomere-binding complex in the human sperm [churikov_novel_2004, gineitis_human_2000]. It has a long extended N-terminal tail and has about 45% amino acid sequence identity and 70% similarity with both the major somatic H2Bs [churikov_novel_2004]. It was first characterized in human as the H2BFWT gene (now called H2BW1 gene). In mouse a paralog of H2B.W variant was initially identified by Govin et al. and named H2BL2 [govin_pericentric_2007]. In human beings, unlike other mammals including the mouse, core histones (H2A, H2B, H3 and H4) are not displaced completely during spermiogenesis and account for approximately 15% of the basic chromosomal proteins within the mature sperm [lee_functional_2009]. At least human H2B.W can replace conventional histone H2B in the nucleosome and does not affect the overall structure and stability of the nucleosome [boulard_nh2_2006]. In contrast to conventional H2B, H2B.W was unable to recruit chromosome condensation factors and to participate in the assembly of mitotic chromosomes; this fact is attributed to its highly divergent NH2 tail [boulard_nh2_2006].", "taxonomy": "Mammals", - "genes": "Human has two H2B.W-encoding paralogs which are now named as H2BW1 and H2BW2 and two pseudogenes (H2BW3P and H2BW4P) all located on the X chromosome between RAB9B and SLC25A3. The H2BW1 gene contains two introns and is transcribed exclusively in testis, where the spliced polyadenylated mRNA was detected [churikov_novel_2004].", + "genes": "Human has two H2B.W-encoding paralogs which are now named as H2BW1 and H2BW2 and two pseudogenes (H2BW3P and H2BW4P) all located on the X chromosome between RAB9B and SLC25A3, while mouse has only one H2B.W-encoding gene (H2bw2) found in a syntenic location. 
Other mammals have different numbers of H2BW paralogs (between 1 and 4) but these are all located at the same conserved location of the X chromosome [Ruth et al]. The H2BFWT gene contains two introns and is transcribed exclusively in testis, where the spliced polyadenylated mRNA was detected [churikov_novel_2004].", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "", "localization": "null", "deposition": "null", "structure": "null", "interactions": "null", - "disease": "Single nucleotide polymorphisms (SNPs) in H2B.W genes may result in male infertility. See meta-analysis of several studies by Teimouri et al. [teimouri_association_2018]. Particularly, there was a significant association between 368A>G transition in H2BW1 and male infertility, resulting in His123Arg substitution.", + "disease": "Single nucleotide polymorphisms (SNPs) in H2B.W genes may result in male infertility. See meta-analysis of several studies by Teimouri et al. [teimouri_association_2018].", "caveats": "null" }, "taxonomic_span": "Mammalia", @@ -2321,19 +3949,24 @@ } ], "publications": [ + " gineitis_human_2000", "11892742", - "22156475" + "22156475", + "boulard_nh2_2006", + "churikov_novel_2004", + "govin_pericentric_2007", + "lee_functional_2009" ] }, "H2B.W.1_(Homo_sapiens)": { - "level": "variant_group", + "level": "variant", "description": { - "summary": "H2B.W.1_(Homo_sapiens) -- is a testis-specific histone variant involved in spermiogenesis encoded by H2BW1 gene (formerly H2BFWT). See H2B.W description for more information.", + "summary": "H2B.W.1_(Homo_sapiens) is a testis-specific histone variant involved in spermiogenesis encoded by H2BW1 gene (formerly H2BFWT). 
See H2B.W description for more information.", "taxonomy": "Mammals", "genes": "Human has two H2B.W-encoding paralogs which are now named as H2BW1 and H2BW2 and two pseudogenes (H2BW3P and H2BW4P) all located on the X chromosome between RAB9B and SLC25A3. The H2BW1 gene contains two introns and is transcribed exclusively in testis, where the spliced polyadenylated mRNA was detected [churikov_novel_2004].", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "", "localization": "null", @@ -2368,14 +4001,14 @@ ] }, "H2B.W.2_(Homo_sapiens)": { - "level": "variant_group", + "level": "variant", "description": { - "summary": "H2B.W.2_(Homo_sapiens) -- is a testis-specific histone variant involved in spermiogenesis encoded by H2BW2 gene (formerly H2BFM). Currenly, it is not well characterized. See H2B.W description for more information.", + "summary": "H2B.W.2_(Homo_sapiens) is a testis-specific histone variant involved in spermiogenesis encoded by H2BW2 gene (formerly H2BFM). Currenly, it is not well characterized. See H2B.W description for more information.", "taxonomy": "Mammals", "genes": "Human has two H2B.W-encoding paralogs which are now named as H2BW1 and H2BW2 and two pseudogenes (H2BW3P and H2BW4P) all located on the X chromosome between RAB9B and SLC25A3. The H2BW2 gene is locate on X-chromosome.", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "", "localization": "null", @@ -2397,90 +4030,113 @@ "22156475" ] }, - "H2B.K": { - "level": "variant_group", + "H2B.W_(Homo_sapiens)": { + "level": "variant", "description": { - "summary": "H2B.K -- is a variant identified so far bioinfomatically by Raman et al. as phylogenetically distinct clade of H2B variants in bony vertebrates [raman_novel_2022]. 
Newly identified histones H2B.N and H2B.K are primarily expressed in ovaries and early embryos, where they may play key roles in female fertility and early development like the cleavage stage histones of sea urchins. Certain changes that distinguish H2B.K from canonical H2B occur around the second DNA binding loop that could affect DNA binding or specificity. H2B.K\u2019s N-terminal tail differs dramatically from canonical H2B [raman_novel_2022]. N-terminal tail is missing key lysine residues that are posttranslationally modified in canonical H2B. Atypically for H2B proteins, H2B.K also has a variable-length polyglutamine tract in its N-terminal tail that could facilitate protein\u2013protein interactions. H2B.K is a newly identified histone variant, its biochemical properties remain uncharacterized [raman_novel_2022].", - "taxonomy": "Bony vertebrates [raman_novel_2022].", - "genes": "An unusual feature of both H2B.K and H2B.N is that they are encoded by intron-containing genes, whereas all other H2B variants and canonical H2B lack introns [raman_novel_2022].", - "evolution": "H2B.K may have a common ancestor with H2B.N. H2B.K is the only H2B variant for which Raman et al. could identify an ortholog in the shared syntenic location in chicken, a nonmammalian outgroup. They found H2B.K orthologs at least as far back as bony fishes in shared syntenic locations. H2B.K orthologs from vertebrates also group with the previously identified cleavage-stage dependent histones in sea urchin. Both H2B.K and H2B.N were pseudogenized in rodents. Both H2B.K and H2B.N were pseudogenized in rodents. [raman_novel_2022].", - "expression": "H2B.K is expressed in ovaries of opossum, dog, and humans, chicken, whereas H2B.K is expressed in both testes and ovaries in pig. Ovarian expression of H2B.K likely predates the divergence of birds and mammals. Analyses of human oogenesis revealed robust expression of H2B.K and H2B.N in oocytes, with levels increasing across oogenesis. 
Neither H2B.K nor H2B.N were detected in granulosa cells, which are the somatic cells of the female germline, suggesting again that expression is restricted to the germline. pol(A) signal is detected in the 3-prime-UTR of most H2B.K genes [raman_novel_2022].", - "knock-out:": "null", + "summary": "H2B.W_(Homo_sapiens) is a testis-specific histone variant involved in spermiogenesis. Human has two H2B.W-encoding paralogs which are now named as H2BW1 and H2BW2 genes. See H2B.W description for more information.", + "taxonomy": "Mammals", + "genes": "Human has two H2B.W-encoding paralogs which are now named as H2BW1 and H2BW2 and two pseudogenes (H2BW3P and H2BW4P) all located on the X chromosome between RAB9B and SLC25A3. The H2BW1 gene contains two introns and is transcribed exclusively in testis, where the spliced polyadenylated mRNA was detected [churikov_novel_2004].", + "evolution": "null", + "expression": "null", + "knock-out": "null", "function": "null", "sequence": "", "localization": "null", "deposition": "null", "structure": "null", "interactions": "null", - "disease": "null", + "disease": "Single nucleotide polymorphisms (SNPs) in H2B.W genes may result in male infertility. See meta-analysis of several studies by Teimouri et al. [teimouri_association_2018]. 
Particularly, there was a significant association between 368A>G transition in H2BW1 and male infertility, resulting in His123Arg substitution.", "caveats": "null" }, - "taxonomic_span": "Euteleostomi", - "taxonomic_span_id": "117571", - "alternate_names": [], + "taxonomic_span": "Mammalia", + "taxonomic_span_id": "40674", + "alternate_names": [ + { + "name": "H2BFWT" + }, + { + "name": "member W" + }, + { + "name": "type W-T" + }, + { + "name": "H2BL2" + }, + { + "name": "spH2B" + } + ], "publications": [ - "raman_novel_2022" + "11892742", + "22156475" ] }, - "H2B.K_(Homo_sapiens)": { - "level": "variant", + "H2B.Z": { + "level": "variant_group", "description": { - "summary": "H2B.K_(Homo_sapiens) -- is mainly oocyte specific H2B.K variant in human encoded by H2BK1 gene (formerly H2BE1). See H2B.K description for more information.", - "taxonomy": "Human", - "genes": "H2BK1 gene", + "summary": "H2B.Z is an apicomplexan specific variant. Different studies performed in Toxoplasma have shown a nucleosome composition in which H2A.Z, but not H2A.X, dimerizes with H2B.Z, while H2A.X dimerizes with canonical H2B (H2Ba in T. gondii), but never with H2B.Z. This fact is also seen in P. 
falciparum, although this parasite lacks H2A.X variant and has driven the hypothesis of a new double variant nucleosome exclusive of parasites with particular characteristics [logie_apicomplexa_2020].", + "taxonomy": "null", + "genes": "null", "evolution": "null", - "expression": "null", - "knock-out:": "null", + "expression": " H2B.Z expression was found to be relatively constitutive, showing only slight decrease in early and mid-trophozoites [miao_malaria_2006].", + "knock-out": "null", "function": "null", - "sequence": "", + "sequence": "null", "localization": "null", "deposition": "null", "structure": "null", "interactions": "null", "disease": "null", - "caveats": "null" + "caveats": "Former name for this histone variant H2Bv from Plasmodium can be confused with H2BV from Trypanosoma, though the two variants are not closely related." }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", - "alternate_names": [], - "publications": [] + "taxonomic_span": "Apicomplexa", + "taxonomic_span_id": "5794", + "alternate_names": [ + { + "name": "H2Bv" + } + ], + "publications": [ + "logie_apicomplexa_2020" + ] }, - "H2B.N": { - "level": "variant_group", + "H3": { + "level": "type", "description": { - "summary": "H2B.N -- is a variant identified so far bioinfomatically by Raman et al. as phylogenetically distinct clade of H2B variants in mammals [raman_novel_2022]. Newly identified histones H2B.N and H2B.K are primarily expressed in ovaries and early embryos, where they may play key roles in female fertility and early development like the cleavage stage histones of sea urchins. H2B.N shares less then 50% identity with canonical H2Bs in the histone fold domain. Although H2A-, H4-interacting residues, and residues in L2 are largely conserved between H2B.N orthologs, they are highly divergent from cH2Bs. H2B.N orthologs are significantly truncated in their C-terminus. 
Removing the alpha-C domain eliminates the important nucleosome acidic patch that mediates many other chromatin interactions. This suggests that the unusual H2B.N could endow nucleosomes with unique properties, or that H2B.N might have evolved nonnucleosomal functions, like H2B.L [raman_novel_2022]. H2B.N is a newly identified histone variant, its biochemical properties remain uncharacterized [raman_novel_2022].", - "taxonomy": "Mammals [raman_novel_2022].", - "genes": " An unusual feature of both H2B.K and H2B.N is that they are encoded by intron-containing genes, whereas all other H2B variants and canonical H2B lack introns. Like most mammals, H2B.K and H2B.N are present in single copy in all primates, whereas H2B.1 and H2B.W are present in mul- tiple copies [raman_novel_2022].", - "evolution": "H2B.K may have a common ancestor with H2B.N. Analysis by Raman et al found that H2B.L and H2B.N contain marsupial and platypus (but not chicken) sequences, and therefore arose in the last common ancestor of all mammals. Both H2B.K and H2B.N were pseudogenized in rodents. [raman_novel_2022].", - "expression": "H2B.N was found to be expressed in ovaries of opossum, dog, and humans. Analyses of human oogenesis revealed robust expression of H2B.K and H2B.N in oocytes, with levels increasing across oogenesis. Neither H2B.K nor H2B.N were detected in granulosa cells, which are the somatic cells of the female germline, suggesting again that expression is restricted to the germline. pol(A) signal is detected in the 3-prime-UTR of most H2B.N genes [raman_novel_2022].", - "knock-out:": "null", + "summary": "H3 is one of the core histone types present in all Eukaryotes. Two H3 and two H4 histones form H3-H4 tetramer via \"hand shake\" and \"four helix bundle\" motifs. Two H2A-H2B dimers then associate with H3-H4 tetramer to form complete nucleosome core. 
Structurally H3 has a histone fold domain, \u03b1N-helix and a long N-terminal tail with many important post-translational modification sites. The \u03b1N-helix organizes the terminal segment of core nucleosomal DNA. The H3 histone class has evolved to encompass a large number of functionally important H3 histone variants. At least two H3 variants are found in most eukaryotic lineages [malik_phylogenomics_2003].", + "taxonomy": "Eukaryotes", + "genes": "null", + "evolution": "The H3\u2013H4 tetramer represents a direct structural and perhaps evolutionary link to the archaeal histone tetramer. Distinct variants of H3 have been usurped for special roles in transcription and even chromosome segregation, whereas H4\u2019s role has remained constant throughout eukaryotic evolution [malik_phylogenomics_2003]. H3 and H4 are more similar to archaeal histones than H2A and H2B, supporting this hypothesis [henneman_structure_2018]. The fact that eukaryotic cells undergo mitosis, in which chromosomes are highly compacted, together with the abundance of gene-poor regions may have favored a histone conformation that wraps DNA twice (eukaryotic octamer) instead of once (archaeal tetramer) and that via its N-terminal tails has the ability to compact DNA at a higher order [henneman_structure_2018].", + "expression": "null", + "knock-out": "null", "function": "null", - "sequence": "", + "sequence": "null", "localization": "null", "deposition": "null", - "structure": "null", + "structure": "The two-fold symmetry of the eukaryotic nucleosome is organized along the dimerization interface of the two H3 molecules using their C-terminal ends, an example of a four-helix bundle motif. 
Apart from its heterodimerization with H4, H3 also makes contacts with H2A and has at least two segments of specific contact with the nucleosomal DNA: just upstream of the alpha-N helix where the H3 tail enters the nucleosome between the DNA gyres, and in the loop 1 region [malik_phylogenomics_2003].", "interactions": "null", "disease": "null", "caveats": "null" }, - "taxonomic_span": "Mammalia", - "taxonomic_span_id": "40674", + "taxonomic_span": "Eukaryotes", + "taxonomic_span_id": "2759", "alternate_names": [], "publications": [ - "raman_novel_2022" + "malik_phylogenomics_2003" ] }, - "H2B.N_(Homo_sapiens)": { - "level": "variant", + "H3.1-like_(Plants)": { + "level": "variant_group", "description": { - "summary": "H2B.N_(Homo_sapiens) -- is mainly oocyte specific H2B.K variant in human encoded by H2BN1 gene. See H2B.N description for more information.", - "taxonomy": "Human", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", - "sequence": "", + "sequence": "null", "localization": "null", "deposition": "null", "structure": "null", @@ -2488,22 +4144,22 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], "publications": [] }, - "H2B.O": { + "H3.3": { "level": "variant_group", "description": { - "summary": "H2B.O -- is a class of H2B sequences identified exclusively in platypus genome that group together in phylogenetic analysis. H2B.O expression appears to be enriched in platypus\u2019 germline tissues (testes or ovaries) albeit at low levels [raman_novel_2022].", - "taxonomy": "Platypus [raman_novel_2022].", + "summary": "H3.3 is a diverse functional class comprising replication-independent (also called replacement) variants of the H3 histone. 
It seems that a distinction between H3 and H3.3 types has arisen numerous times in evolution. At least four such instances are evident in ciliates, apicomplexans, animals and plants [malik_phylogenomics_2003]. H3.3 are characterized by changes at four positions with respect to cH3s, one in the N-terminal tail and three in the alpha-2-helix of the histone fold domain. Strictly speaking, this is not convergent evolution because the H3.3 versions do not all have the same amino acid residues in these four positions. However, it strongly suggests that a similar constraint has led to these repeated origins of distinguishable H3 and H3.3 types [malik_phylogenomics_2003]. Nevertheless, given the likelihood of independent divergences, H3.3 variants from different taxonomic clades may be neither more nor less orthologous to animal H3.3 than their cH3 counterparts [talbert_unified_2012]. Replication-independent and replication-coupled H3 variants within an organism typically differ in residue 31 (and whether it can be phosphorylated) as well as residues 86?? and 89, but distinguishing residues vary in different organisms and caution is advised in designating H3.3 in less well-studied eukaryotic kingdoms [talbert_unified_2012].", + "taxonomy": "Eukaryotes", "genes": "null", - "evolution": "null", - "expression": "H2B.O expression appears to be enriched in platypus\u2019 germline tissues (testes or ovaries) albeit at low levels [raman_novel_2022].", - "knock-out:": "null", + "evolution": "According to Malik et al. no eukaryotic genome has been characterized that has only canonical H3 and not H3.3. Although there is little doubt regarding multiple origins of H3.3, it is certainly conceivable that ancestrally, an H3.3 was present in a small, predominantly transcriptionally active genome. 
The rapid expansion of eukaryotic genomes, large portions of which became silent in differentiated cells, may have selected for H3 and its expansion, both for increasing bulk packaging duties and to ensure transcriptional silencing where appropriate. In this regard, it is important to note that even in the archaeon M. fervidus, this division of labor is evident between HMfA and HMfB5 [malik_phylogenomics_2003].", + "expression": "null", + "knock-out": "null", "function": "null", - "sequence": "", + "sequence": "null", "localization": "null", "deposition": "null", "structure": "null", @@ -2511,47 +4167,46 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Ornithorhynchus anatinus", - "taxonomic_span_id": "9258", + "taxonomic_span": "Eukaryotes", + "taxonomic_span_id": "2759", "alternate_names": [], "publications": [ - "raman_novel_2022" + "malik_phylogenomics_2003", + "talbert_unified_2012" ] }, - "H2B.S": { + "H3.3-like?": { "level": "variant_group", "description": { - "summary": "H2B.S -- is a class a new class of highly divergent H2B variants identified by Jiang et al. that specifically accumulate during chromatin compaction of dry seed embryos in multiple species of flowering plants [jiang_evolution_2020].", - "taxonomy": "Flowering plants (angiosperms) [jiang_evolution_2020]", - "genes": "HTB8 gene in Arabidopsis, Solyc06g074750.1 in tomato, LOC_Os09g39730 in rice.", - "evolution": "Despite forming a distinct angiosperm-specific clade, H2B.S variants show a high degree of variation, even amongst closely related genera. Other highly divergent sequences from Streptophyte algae and gymnosperms form a grade basal to H2B.S variants, suggesting a deeper evolutionary origin, which cannot be currently analyzed due to the lack of conserved substitutions and similar sequences in bryophytes, lycophytes and ferns [jiang_evolution_2020].", - "expression": "Arabidopsis HTB8 is specifically expressed in sperm and mature embryos. 
Unlike Arabidopsis HTB8, expression in anthers, pollen or sperm cells was not evident neither in rice nor maize [jiang_evolution_2020].", - "knock-out:": "null", - "function": "For Arabidopsis an adaptive function in cell types that become desiccated, quiescent or show higher degrees of chromatin compaction has been suggested [jiang_evolution_2020].", - "sequence": "The angiosperm-specific clade of Arabidopsis HTB8 orthologs were characterized by conserved substitutions in the histone core, slightly extended C-terminal tails and greatly expanded N-terminal tails with a KVVXETV motif [jiang_evolution_2020].", + "summary": "null", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", "localization": "null", "deposition": "null", - "structure": "Two HTB8 residues, Arg152 and Met179, were highly conserved among HTB8 orthologs and were positioned in such a way that they might contribute to stronger interactions with DNA and histone H2A, respectively. These and other observations suggest that sequence divergence in HTB8 impact intra-nucleosomal interactions to potentially alter nucleosome structure and/or stability [jiang_evolution_2020].", + "structure": "null", "interactions": "null", "disease": "null", "caveats": "null" }, - "taxonomic_span": "Magnoliopsida", - "taxonomic_span_id": "3398", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], - "publications": [ - "jiang_evolution_2020" - ] + "publications": [] }, - "gH2B": { - "level": "variant_group", + "H3.3-like_(Animals)": { + "level": "variant", "description": { - "summary": "gH2B is a group of plant H2B variants found in Lilium that are highly divergent from the canonical H2B and are expressed in the generative cell of the bicellular pollen where it may be necessary for chromatin remodeling of the male germline [alvarez-venegas_canonical_2019,yang_proteomic_2016,ueda_unusual_2000]. 
The subvariants so far identified are named gH2B in Lilium longiflorum, mgH2B in Lilium davidii, and mgH2B.in in Lilium davidii. These subvariants are rather different and are grouped due to lack of further information. Some phylogenetic reconstructions cluster these variant together with H2B.S [alvarez-venegas_canonical_2019], however, this may be likely to long branch attraction, and the exact phylogeny remains to be studied [jiang_evolution_2020].", + "summary": "null", "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -2561,25 +4216,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Lilium", - "taxonomic_span_id": "4688", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], - "publications": [ - "alvarez-venegas_canonical_2019", - "yang_proteomic_2016", - "ueda_unusual_2000", - "jiang_evolution_2020" - ] + "publications": [] }, - "H2B.Z": { - "level": "variant_group", + "H3.3-like_(Plants)": { + "level": "variant", "description": { - "summary": "H2B.Z is an apicomplexan specific variant. Different studies performed in Toxoplasma have shown a nucleosome composition in which H2A.Z, but not H2A.X, dimerizes with H2B.Z, while H2A.X dimerizes with canonical H2B (H2Ba in T. gondii), but never with H2B.Z. This fact is also seen in P. 
falciparum, although this parasite lacks H2A.X variant and has driven the hypothesis of a new double variant nucleosome exclusive of parasites with particular characteristics [logie_apicomplexa_2020].", + "summary": "null", "taxonomy": "null", "genes": "null", "evolution": "null", - "expression": " H2B.Z expression was found to be relatively constitutive, showing only slight decrease in early and mid-trophozoites [miao_malaria_2006].", - "knock-out:": "null", + "expression": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -2587,57 +4237,51 @@ "structure": "null", "interactions": "null", "disease": "null", - "caveats": "Former name for this histone variant H2Bv from Plasmodium can be confused with H2BV from Trypanosoma, though the two variants are not closely related." + "caveats": "null" }, - "taxonomic_span": "Apicomplexa", - "taxonomic_span_id": "5794", - "alternate_names": [ - { - "name": "H2Bv" - } - ], - "publications": [ - "logie_apicomplexa_2020" - ] + "taxonomic_span": "null", + "taxonomic_span_id": "null", + "alternate_names": [], + "publications": [] }, - "H2B.V": { - "level": "variant_group", + "H3.3_(Animals)": { + "level": "variant", "description": { - "summary": "H2B.V is a histone variant characterized so far in Trypanosoma brucei. It shares ~38% sequence identity with major H2B. H2B.V is essential for viability. H2A.Z and H2B.V colocalize throughout the cell cycle and exhibit nearly identical genomic distribution. Data strongly suggest that H2A.Z and H2B.V function together within a single nucleosome [lowell_histone_2005]. H2BV possibly regulates H3 K4 and K76 trimethylation in Trypanosoma brucei [mandava_trypanosome_2008].", - "taxonomy": "Trypanosoma", - "genes": "null", + "summary": "H3.3_(Animals) is a class of replication-independent (also called replacement) variants of the H3 histone in animals. 
H3.3 is characterized by changes at four positions with respect to cH3s, one in the N-terminal tail and three in the alpha-2-helix of the histone fold domain (positions 31,87,89,90). The sequence differences within the alpha-2-helix allow H3.3 to interact specifically with its own chaperones (HIRA, ATRX, DAXX). At position 31 H3.3s instead of alanine have serine or threonine which can be phosphorylated. There are multiple studies showing that phosphorylation of this site is functionally important [talbert_unified_2012]. Particularly, H3.3S31ph is associated with H3.3K27 acetylation which helps gene activation and was shown to be essential for gastrulation in Xenopus [sitbon_histone_2020]. The metazoan histone H3.3 has been most closely associated with active transcription, replacing cH3s at active genes and promoters, implicated in diverse biological processes, including development, transcriptional memory and transcriptional reprogramming. However, genetic studies also highlighted its importance in maintaining heterochromatin at telomeres, centromeres, and pericentromeric regions [jang_histone_2015], and revealed essential functions of H3.3 in the germline and early embryonic development [elsaesser_new_2010,yuen_histone_2014,jang_histone_2015].", + "taxonomy": "Animals (Metazoa)", + "genes": "In human H3.3 is encoded by H3-3A and H3-3B genes (formerly, H3F3A and H3F3B), located on chromosomes 1 (1q42.12) and 17 (17q25), respectively. In mouse it is encoded by the H3f3a and H3f3b genes. Genes have introns.", "evolution": "null", - "expression": "null", - "knock-out:": "null", - "function": "null", + "expression": "H3.3 mRNAs are polyadenylated. Expressed independent of DNA synthesis through the cell cycle.", + "knock-out": "In mice complete depletion of H3.3 leads to developmental retardation and early embryonic lethality. At the cellular level, H3.3 loss triggers cell cycle suppression and cell death. 
Surprisingly, H3.3 depletion does not dramatically disrupt gene regulation in the developing embryo. Instead, H3.3 depletion causes dysfunction of heterochromatin structures at telomeres, centromeres, and pericentromeric regions of chromosomes, leading to mitotic defects [jang_histone_2015]. In C. elegans, neither loss of individual H3.3 homologs nor the knockout of all five H3.3-coding genes causes sterility or lethality. However, the conserved histone chaperone HIRA has an essential role in the nucleosomal loading of all H3.3 variants. This requirement can be bypassed by mutation of the H3.3-specific residues to those found in H3. While even removal of all H3.3 homologs does not result in lethality, it leads to reduced fertility and viability in response to high-temperature stress [delaney_differential_2018]. Flies that lack both H3.3 genes have reduced viability and individuals that survive to adulthood are completely sterile in both sexes [sakai_transcriptional_2009]. In mice, targeted disruption of one H3.3 gene (H3f3b) results in a number of phenotypic abnormalities, including a reduction in H3.3 histone levels, leading to male infertility, as well as abnormal sperm and testes morphology. Additionally, null germ cell populations at specific stages in spermatogenesis, in particular spermatocytes and spermatogonia, exhibited increased rates of apoptosis. Disruption of H3f3b also altered histone post-translational modifications and gene expression in the testes, with the most prominent changes occurring at genes involved in spermatogenesis. 
Finally, H3f3b null testes also exhibited abnormal germ cell chromatin reorganization and reduced protamine incorporation [yuen_histone_2014].", + "function": "H3.3 has been implicated in a variety of biological processes: it is important for embryonic stem cell differentiation, epigenetic reprogramming following somatic cell nuclear transfer, neuron plasticity, the DNA damage response and centromere maintenance. H3.3 is also essential for germ line development in mammals, where it is required for the remodeling of both maternal and paternal gametes [delaney_differential_2018]. Its role in histone replacement at active genes and promoters is highly conserved and has been proposed to participate in the epigenetic transmission of active chromatin states [szenker_double_2011]. However, its accumulation at silent loci in pericentric heterochromatin and telomeres raises questions concerning the actual function of H3.3.", "sequence": "null", "localization": "null", - "deposition": "null", + "deposition": "In humans and other animals the specialized chaperone HIRA places H3.3 at sites of histone turnover where it replaces canonical H3s. Such sites include active genes, promoters, enhancers, and transcription termination sites. Chaperones ATRX and DAXX deposit H3.3 in telomeres, imprinted genes and other heterochromatic loci, where it is modified with the trimethylated lysine 9 heterochromatic mark (denoted H3K9me3) to maintain heterochromatin at these locations [talbert_histone_2021]. While the majority of nucleosomes are replaced by protamines during mammalian spermatogenesis, some H3.3 nucleosomes are retained and may transmit epigenetic information to the zygote [delaney_differential_2018]. In embryonic stem cells, for example, HIRA chaperones H3.3 to both active and repressed genes, including also bivalent promoters normally repressed in embryonic stem cells. 
This highlights a role of HIRA in establishing chromatin landscapes not always related to active chromatin but key to allow proper differentiation [otero_histone_2014].", "structure": "null", "interactions": "null", - "disease": "null", + "disease": "Mutations in histone genes can affect sites of PTMs causing changes in local and global DNA methylation status. These effects are directly linked to neoplastic transformation by altered gene expression. Recurrent H3.3 histone mutations are increasingly identified in several malignancies and developmental disorders in human [kumar_genes_2021]. Well characterized oncomutations in H3.3 genes include K27M, G34W/L in pediatric high-grade gliomas and K36M and G34V/R in bone tumors [xiong_histone_2016]. Competing models have suggested that H3K27M oncohistones sequester or poison PRC2 complex which deposits H3K27me3 marks. However, Sarthy et al. demonstrated that the K27M epitope only inhibits H3K27 trimethylation on chromatin in vivo, supporting the idea that these oncohistones inhibit chromatin-bound PRC2 complexes. A possible mechanism comes from recent reports [lee_automethylation_2019,wang_regulation_2019] showing that EZH2 (key component of PRC2) methylates itself, and that this automethylation is required for full catalytic activity. 
These studies also showed that H3K27M blocks EZH2 automethylation, and might contribute to the dominant effect of H3K27M mutations [sarthy_histone_2020].", "caveats": "null" }, - "taxonomic_span": "Trypanosoma", - "taxonomic_span_id": "5690", - "alternate_names": [ - { - "name": "H2BV" - } - ], + "taxonomic_span": "Metazoa", + "taxonomic_span_id": "33208", + "alternate_names": [], "publications": [ - "lowell_histone_2005" + "elsaesser_new_2010", + "jang_histone_2015", + "sitbon_histone_2020", + "talbert_unified_2012", + "yuen_histone_2014" ] }, - "CS_H2B_(Echinoidea)": { - "level": "variant_group", + "H3.3_(Ascomycota)": { + "level": "variant", "description": { - "summary": "CS_H2B_(Echinoidea) is a histone variant class containing cleavage-stage (CS) H2B histones characterized so far in sea urchins. Four classes of histones in sea urchins have been characterized. Three sets of histone variants are coexisting in the embryo at larval stages of sea urchin\u2019s development: the maternally inherited cleavage stage variants (CS) expressed during the two initial cleavage divisions, the early histone variants, which are recruited into embryonic chromatin from middle cleavage stages until hatching and the late variants, that are fundamentally expressed from blastula stage onward [oliver_conservative_2003]. The fourth class of histones in sea urchins are the sperm histones. They are exclusively transcribed during spermatogenesis and code for specialized H1 and H2B proteins with basic N-terminal extensions which are responsible for the unusually high chromatin condensation in mature sperm [mandl_five_1997]. Early, late, and sperm histone genes lack introns, contain the conserved 3-prime terminal stem-loop structure instead of a poly(A) addition site, and thus show the classical hallmarks of replication-dependent histone genes. The CS proteins are the first histones to be synthesized after fertilization in the cleaving embryo. 
The CS histones appear to be synthesized during oogenesis and in the mature egg, where they give rise to a large maternal pool of histone proteins. The CS proteins are the only histones present in the chromatin of the egg and zygote up to the second cell division. Thereafter, the efficient synthesis of the early histones leads to a rapid dilution of the CS histones in the chromatin except in the nondividing small micromeres, where the CS proteins remain the major histones up to the pluteus larva stage. The maternally stored CS histones play an important role in remodeling of the sperm chromatin after fertilization. Upon entry in the egg cytoplasm, the sperm H1 and H2B proteins present in the male pronucleus are rapidly phosphorylated on their N-terminal extensions, and the sperm H1 protein is subsequently replaced in the chromatin by the CS H1 protein. This exchange of H1 histones is immediately followed by decondensation of the chromatin. At around the time of DNA replication, the CS H2A and H2B proteins start to accumulate in the chromatin of the male pronucleus, which correlates with the transition of the nucleosomal repeat length from 250 bp in the sperm chromatin to 200 bp in the early embryo. As a consequence of this massive chromatin restructuring, the paternal genome is transcriptionally activated already at the beginning of S phase in the first cell cycle, which further emphasizes the importance of the CS histones for early development [mandl_five_1997].", - "taxonomy": "Echinoidea (sea urchins)", - "genes": "null", + "summary": "H3.3_(Ascomycota) is the main form of H3 histone in Ascomycetes.", + "taxonomy": "Fungi", + "genes": "In S. 
cerevisiae H3 histone is encoded by HHT1 and HHT2 genes", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -2645,29 +4289,22 @@ "structure": "null", "interactions": "null", "disease": "null", - "caveats": "It is likely, that CS_H2B homologs are present in other taxonomic clades. Raman et al. suggested that newly identified histones H2B.N and H2B.K which are primarily expressed in ovaries and early embryos of mammals and may play key roles in female fertility and early development may be related to the cleavage stage histones of sea urchins [raman_novel_2022]. Other CS histones, such as CS H1 in sea urchins are functionally equivalent to frog H1M(B) proteins [mandl_five_1997]." + "caveats": "null" }, - "taxonomic_span": "Echinoidea", - "taxonomic_span_id": "7625", - "alternate_names": [ - { - "name": "cleavage H2B" - } - ], - "publications": [ - "oliver_conservative_2003", - "mandl_five_1997" - ] + "taxonomic_span": "Ascomycota", + "taxonomic_span_id": "4890", + "alternate_names": [], + "publications": [] }, - "early_H2B_(Echinoidea)": { - "level": "variant_group", + "H3.3_(Fungi)": { + "level": "variant", "description": { - "summary": "early_H2B_(Echinoidea) is a histone variant class of early H2B histones characterized so far in sea urchins. Four classes of histones in sea urchins have been characterized. Three sets of histone variants are coexisting in the embryo at larval stages of sea urchin\u2019s development: the maternally inherited cleavage stage variants (CS) expressed during the two initial cleavage divisions, the early histone variants, which are recruited into embryonic chromatin from middle cleavage stages until hatching and the late variants, that are fundamentally expressed from blastula stage onward [oliver_conservative_2003]. The fourth class of histones in sea urchins are the sperm histones [mandl_five_1997]. 
Early, late, and sperm histone genes lack introns, contain the conserved 3-prime terminal stem-loop structure instead of a poly(A) addition site, and thus show the classical hallmarks of replication-dependent histone genes. The repetitive early histone genes are transcriptionally activated upon meiotic maturation of the egg, are maximally expressed in the rapidly dividing blastula embryo, and are already silenced at the hatching blastula stage, when the transcripts of late histone genes start to accumulate [mandl_five_1997].", - "taxonomy": "Echinoidea (sea urchins)", - "genes": "null", + "summary": "H3.3_(Fungi) is a class of H3 histone variants in Fungi which share similarity to H3.3 in other kingdoms (characteristic amino acids at the four key positions). It is, however, the main form of histone H3 in Ascomycetes, where canonical H3 was lost during evolution [malik_phylogenomics_2003]. While H3.3 in Ascomycetes is the only form of H3 histone it is mainly referred to as H3 rather than H3.3. In the current classification we will refer to such histones as H3.3_(Ascomycota) to retain their proper placement within our classification. Basidiomycetes have both canonical H3 and H3.3 histones. Fungi H3.3 along with plant and animal H3.3s have evolved independently, but share similar sequence differences with respective canonical H3s. It is likely that they have evolved under similar constraints. Since H3.3 as a separate variant is available only in Basidiomycetes the H3.3/cH3 functional difference in Fungi remains poorly studied. Anju et al. have characterized two H3 genes in basidiomycete Ustilago maydis, U1 and U2. The U1 gene was shown to possess replication-independent expression and sequence characteristic of H3.3 replacement histones, while U2 gene manifested replication-coupled expression typical for canonical H3 [anju_identification_2011].", + "taxonomy": "Fungi", + "genes": "In S. cerevisiae H3 histone is encoded by HHT1 and HHT2 genes. 
U1 gene in Ustilago maydis.", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -2677,23 +4314,23 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Echinoidea", - "taxonomic_span_id": "7625", + "taxonomic_span": "Fungi", + "taxonomic_span_id": "4751", "alternate_names": [], "publications": [ - "oliver_conservative_2003", - "mandl_five_1997" + "anju_identification_2011", + "malik_phylogenomics_2003" ] }, - "late_H2B_(Echinoidea)": { - "level": "variant_group", + "H3.3_(Homo_sapiens)": { + "level": "variant", "description": { - "summary": "late_H2B_(Echinoidea) is a histone variant class of late H2B histones characterized so far in sea urchins. Four classes of histones in sea urchins have been characterized. Three sets of histone variants are coexisting in the embryo at larval stages of sea urchin\u2019s development: the maternally inherited cleavage stage variants (CS) expressed during the two initial cleavage divisions, the early histone variants, which are recruited into embryonic chromatin from middle cleavage stages until hatching and the late variants, that are fundamentally expressed from blastula stage onward [oliver_conservative_2003]. The fourth class of histones in sea urchins are the sperm histones [mandl_five_1997]. Early, late, and sperm histone genes lack introns, contain the conserved 3-prime terminal stem-loop structure instead of a poly(A) addition site, and thus show the classical hallmarks of replication-dependent histone genes. The repetitive early histone genes are transcriptionally activated upon meiotic maturation of the egg, are maximally expressed in the rapidly dividing blastula embryo, and are already silenced at the hatching blastula stage, when the transcripts of late histone genes start to accumulate [mandl_five_1997]. 
Late genes are active from the late blastula stage onward [maxson_evolution_1987].", - "taxonomy": "Echinoidea (sea urchins)", + "summary": "H3.3_(Homo_sapiens) is a class of replication-independent (also called replacement) variants of the H3 histone in human encoded by H3-3A and H3-3B genes. Both genes code for an identical protein. See H3.3_(Animals) for a detailed description of this variant.", + "taxonomy": "Homo sapiens", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -2703,117 +4340,118 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Echinoidea", - "taxonomic_span_id": "7625", + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", "alternate_names": [], - "publications": [ - "oliver_conservative_2003", - "mandl_five_1997", - "maxson_evolution_1987" - ] + "publications": [] }, - "sperm_H2B_(Echinoidea)": { - "level": "variant_group", + "H3.3_(Plants)": { + "level": "variant", "description": { - "summary": "sperm_H2B_(Echinoidea) is a histone variant class of sperm H2B histones characterized so far in sea urchins. Four classes of histones in sea urchins have been characterized. Three sets of histone variants are coexisting in the embryo at larval stages of sea urchin\u2019s development: the maternally inherited cleavage stage variants (CS) expressed during the two initial cleavage divisions, the early histone variants, which are recruited into embryonic chromatin from middle cleavage stages until hatching and the late variants, that are fundamentally expressed from blastula stage onward [oliver_conservative_2003]. The fourth class of histones in sea urchins are the sperm histones. 
They are exclusively transcribed during spermatogenesis and code for specialized H1 and H2B proteins with basic N-terminal extensions which are responsible for the unusually high chromatin condensation in mature sperm [mandl_five_1997]. In parechinus angulosus the characterized sperm H2B sequence has a repeating pentapeptide in the N-terminal region [strickland_complete_1978].", - "taxonomy": "Echinoidea (sea urchins)", - "genes": "null", + "summary": "H3.3_(Plants) is a class of replication-independent (also called replacement) variants of the H3 histone in green plants (Viridiplantae), which include green algae and land plants. Despite having the same name as H3.3 of animals, similar functions and key amino acid differences with respective canonical H3s, plant H3.3 has evolved independently. However, this strongly suggests that a similar constraint has led to these repeated origins of distinguishable H3 and H3.3 types [malik_phylogenomics_2003]. H3.3 in plants is characterized by changes at four positions with respect to cH3s, two in the N-terminal tail and two in the alpha-2-helix of the histone fold domain (positions 31, 41, 87, 90, compare with positions 31,87,89,90 in animals). At position 31 H3.3s in plants instead of alanine usually have threonine which can be phosphorylated [talbert_unified_2012]. H3.3 is likely involved in transcriptional regulation, is enriched in the body of actively transcribed genes, promoters and downstream of transcription termination sites in some genes [alvarez-venegas_canonical_2019]. Certain mechanisms of H3.3 action have been reported. Jacob et al. have shown that the SET domain of the histone H3 lysine-27 (H3K27) methyltransferase ATXR5 has a bipartite catalytic domain that specifically reads alanine-31 of H3.1. Thus variation at position 31 between H3.1 and replication-independent H3.3 is responsible for inhibiting the activity of ATXR5 and its paralog, ATXR6 [jacob_selective_2014]. Wollmann et al. 
proposed that H3.3 prevents recruitment of H1, inhibiting H1\u2019s promotion of chromatin folding that restricts access to DNA methyltransferases responsible for gene body methylation. Thus, gene body methylation is likely shaped by H3.3 dynamics in conjunction with transcriptional activity [wollmann_histone_2017].", + "taxonomy": "Green plants (Viridiplantae)", + "genes": "In contrast to intronless cH3s, H3.3 genes in plants have introns. In Arabidopsis H3.3 is represented by HTR4, HTR5, and HTR8 genes [alvarez-venegas_canonical_2019].", "evolution": "null", - "expression": "null", - "knock-out:": "null", + "expression": "In Arabidopsis, H3.3 genes do not show replication-dependent expression and are rather expressed throughout the cell cycle. In addition, expression of Arabidopsis genes encoding histone H3.3 occurs not only in young, undifferentiated, but also in mature tissues suggesting that the expression of these genes continues after cell division ceases [alvarez-venegas_canonical_2019].", + "knock-out": "In Arabidopsis, removal of three H3.3 genes (HTR4, HTR5, and HTR8) causes defects in male gametogenesis and results in embryonic lethality [wollmann_histone_2017].", "function": "null", - "sequence": "null", + "sequence": "Characteristic changes between cH3 and H3.3 in plants are A31T, F41Y, S87H, and A90L [alvarez-venegas_canonical_2019].", "localization": "null", - "deposition": "null", + "deposition": "Similar to animals, plants have a specialized chaperone HIRA that places H3.3 at sites of histone turnover where it replaces canonical H3s [otero_histone_2014]. Such sites include active genes, promoters, enhancers, transcription termination sites. In animals chaperones ATRX and DAXX deposit H3.3 in telomeres, imprinted genes and other heterochromatic loci [talbert_histone_2021]. A DAXX homolog has not been found in plants so far, but there is one gene coding for a homolog of ATRX. 
There are also several genes distantly related to animal DEK, which was shown to have histone chaperone activity. The structural and functional characterization of these chaperones in plants awaits future studies [otero_histone_2014].", "structure": "null", "interactions": "null", "disease": "null", "caveats": "null" }, - "taxonomic_span": "Echinoidea", - "taxonomic_span_id": "7625", + "taxonomic_span": "Viridiplantae", + "taxonomic_span_id": "33090", "alternate_names": [], "publications": [ - "oliver_conservative_2003", - "mandl_five_1997", - "strickland_complete_1978" + "alvarez-venegas_canonical_2019", + "jacob_selective_2014", + "malik_phylogenomics_2003", + "talbert_unified_2012", + "wollmann_histone_2017" ] }, - "H3": { - "level": "type", - "description": { - "summary": "H3 is one of the core histone types present in all Eukaryotes. Two H3 and two H4 histones form H3-H4 tetramer via \"hand shake\" and \"four helix bundle\" motifs. Two H2A-H2B dimers then associate with H3-H4 tetramer to form complete nucleosome core. Structurally H3 has a histone fold domain, \u03b1N-helix and a long N-terminal tail with many important post-translational modification sites. The \u03b1N-helix organizes the terminal segment of core nucleosomal DNA. H3 histone class has evolved to encomass a large number of functionally important H3 histone variants. At least two H3 variants are found in most eukaryotic lineages [malik_phylogenomics_2003].", - "taxonomy": "Eukaryotes", - "genes": "null", - "evolution": "The H3\u2013H4 tetramer represents a direct structural and perhaps evolutionary link to the archaeal histone tetramer. Distinct variants of H3 have been usurped for special roles in transcription and even chromosome segregation, whereas H4\u2019s role has remained constant throughout eukaryotic evolution [malik_phylogenomics_2003]. H3 and H4 are more similar to archaeal histones than H2A and H2B, supporting this hypothesis [henneman_structure_2018]. 
The fact that eukaryotic cells undergo mitosis, in which chromosomes are highly compacted, together with the abundance of gene-poor regions may have favored a histone conformation that wraps DNA twice (eukaryotic octamer) instead of once (archaeal tetramer) and that via its N-terminal tails has the ability to compact DNA at ahigher order [henneman_structure_2018].", + "H3.3_(Protists)": { + "level": "variant", + "description": { + "summary": "H3.3_(Protists) is a class of H3.3-like replication-independent (also called replacement) variants of the H3 histone in Protists. The hv2 H3 histone variant in Tetrahymena thermophila is among the few from this group that have been characterized [yu_constitutive_1997]. Sequence analysis suggests that other protists such as Porphyra, Thalassiosira, Dictyostelium have H3 histones with characteristic differences at positions 31 and 85-89, which may suggest the presence of H3.3-like histones in their genomes [talbert_unified_2012].", + "taxonomy": "Protists", + "genes": "HHT3 gene in Tetrahymena thermophila", + "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", "deposition": "null", - "structure": "The two-fold symmetry of the eukaryotic nucleosome is organized along the dimerization interface of the two H3 molecules using their C-terminal ends, an example of a four-helix bundle motif. 
Apart from its heterodimerization with H4, H3 also makes contacts with H2A and has at least two segments of specific contact with the nucleosomal DNA: just upstream of the alpha-N helix where the H3 tail enters the nucleosome between the DNA gyres, and in the loop 1 region [malik_phylogenomics_2003].", + "structure": "null", "interactions": "null", "disease": "null", "caveats": "null" }, - "taxonomic_span": "Eukaryotes", - "taxonomic_span_id": "2759", + "taxonomic_span": "SAR,Metamonada,Discoba,Amoebozoa", + "taxonomic_span_id": "2698737,2611341,2611352,554915", + "alternate_names": [ + { + "name": "hv2" + } + ], "publications": [ - "malik_phylogenomics_2003" + "talbert_unified_2012", + "yu_constitutive_1997" ] }, - "cH3": { + "H3.4_(Mammalia)": { "level": "variant_group", "description": { - "summary": "cH3 -- canonical H3 histones. This is a loosely defined group that encompasses major H3 histone proteins that are mainly expressed during S-phase of the cell cycle in eukaryotes and are highly conserved even between distantly related species. Such proteins are often called replication dependent (RD), replication coupled (RC), clustered or \"bulk\" histones [marzluff_metabolism_2008,talbert_histone_2021]. They are likely similar to the original H3 histones of the last common ancestor of eukaryotes [malik_phylogenomics_2003]. Expression of canonical histones during S-phase is often tightly regulated, but mechanisms may differ among kindoms [marzluff_birth_2017,pontarotti_long-term_2009]. Canonical histone genes are often present as large mulrigene families clustered together in certain locations of the genome. However, there are known limitations to the definition given above. Functional diversification of paralogous genes is a common process in evolution -- in some species multiple copies of canonical histone genes have undergone diversification in terms of sequence variation, cell-cycle or tissue-specific expression patterns. 
Such diversification for cH3s is rather limited compared to cH2As and cH2Bs. In humans there are only two very similar cH3 isoforms both expressed in S-phase (cH3.1 and cH3.2). However, the mamal-specific H3.4 variant, which manifests tissue specific expression, is in fact a very closely related to the canonical H3s (similarly to cH2A.1 and cH2B.1 is is located within histone gene clusters and has mRNA with a stem-loop). In plants, some cH3s show variable expression patterns [alvarez-venegas_canonical_2019]. Hence, whether a particular gene should be regarded as a canonical, a bona fide variant or a canonical subvariant/isoform may be a matter of debate and definition in each particular case. Another complication with defining cH3 class is that major H3 variants, such as H3.3, may only have 3-4 amino acid deference with the canonical H3 histone. They may have arisen multiple times during evolution and hence their functional classification does not match the phylogenetic classificstion. Ascomycetes are thought to have lost cH3 genes and generally have only a single form which is H3.3-like, it is usually referred to simply as H3 [talbert_unified_2012, malik_phylogenomics_2003]. Within the current hierarchical classification system, additional information about the cH3 class may be gained by looking at the description of its subclasses. ", - "taxonomy": "Eukaryotes, although lost in ascomycetes.", - "genes": "null", + "summary": "H3.4_(Mammalia) is a mammal-specific H3 histone variant highly expressed in testis and at lower levels in other tissues [kycia_tudor_2014]. This variant is also referred to as H3.1t, H3T, or TS H3.4. The H3.4 variant is very similar to canonical H3 histones both in sequence, gene location and transcriptional regulation. In human H3.4 has only 4 amino acid differences from cH3s (A23V, V71M, A98S, A111V); its gene is located within a histone gene cluster and is intronless, and its mRNA has a stem-loop structure. 
H3.4 expression is replication-dependent [ueda_testis-specific_2017]. Mouse H3.4 was shown to be essential for very early stages of spermatogenesis; its deficiency leads to azoospermia because of the loss of haploid germ cells. When differentiating spermatogonia emerge in normal spermatogenesis, H3.4 appears and replaces the canonical H3 proteins [ueda_testis-specific_2017]. Structural studies have revealed that H3.4-containing nucleosomes are less stable, particularly due to V71M and A111V substitutions [tachiwana_structural_2010]. Tachiwana et al. have found that H3.4/H4 is not efficiently incorporated into the nucleosome by human Nap1 chaperone, due to its defective H3.4/H4 deposition on DNA. In contrast, human Nap2 chaperone, a paralog of Nap1, promoted nucleosome assembly with H3.4/H4. Mutational analyses revealed that the A111V mutation in H3.4 is essential for this difference [tachiwana_nucleosome_2008]. It was demonstrated that A23V mutation favors the interaction of trimethyllysine-binding Tudor domains of PHF1 and PHF19 proteins (critical components of the PRC2 complex) with H3K27me3 marks. PHF1 co-localizes with H3.4 in testis and its Tudor domain preferentially binds to H3.4K27me3 over canonical H3K27me3 in vitro, implicating that H3.4K27me3 might be a physiological ligand of PHF1/19 [dong_structural_2020, kycia_tudor_2014].", + "taxonomy": "Mammals", + "genes": "In human it is encoded by the H3-4 gene (formerly HIST3H3, also an alias name H3C16 has been suggested (Seal et al.)), in mouse by the H3f4 gene. The gene encodes mRNA with a stem loop structure. In human the gene is located on chromosome 1 adjacent to genes H2AC25 and H2BC26 in a small histone gene cluster.", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "Knockout mice for H3.4 were first generated in 2017; both male and female H3t null mice were viable and healthy, but the male mice were sterile. 
H3.4 deficiency leads to azoospermia because of the loss of haploid germ cells[ueda_testis-specific_2017].", "function": "null", "sequence": "null", "localization": "null", "deposition": "null", - "structure": "null", + "structure": "PDB structure of human H3.4 containing nucleosome is available with id 3A6N [tachiwana_structural_2010].", "interactions": "null", - "disease": "null", - "caveats": "" + "disease": "The single\u2011nucleotide polymorphism c190C>T (Arg64Cys) in the human testis\u2011specific histone variant, H3.4, was studied in Japanese patients for its association with Sertoli cell\u2011only syndrome, which causes infertility [dong_structural_2020].", + "caveats": "null" }, - "taxonomic_span": "Eukaryota", - "taxonomic_span_id": "2759", + "taxonomic_span": "Mammalia", + "taxonomic_span_id": "40674", "alternate_names": [ { - "name": "canonical H3" - }, - { - "name": "RC H3" + "name": "H3T" }, { - "name": "RD H3" + "name": "H3.1t" } ], "publications": [ - "marzluff_metabolism_2008", - "talbert_histone_2021", - "malik_phylogenomics_2003", - "marzluff_birth_2017", - "pontarotti_long-term_2009", - "alvarez-venegas_canonical_2019", - "talbert_unified_2012", - " malik_phylogenomics_2003" + " kycia_tudor_2014", + "22650316", + "8986613", + "dong_structural_2020", + "kycia_tudor_2014", + "tachiwana_nucleosome_2008", + "tachiwana_structural_2010", + "ueda_testis-specific_2017" ] }, - "cH3_(Animals)": { + "H3.5_(Primates_or_Hominids?)": { "level": "variant_group", "description": { - "summary": "cH3_(Animals) -- clustered H3 histones in animals (Metazoa), often called canonical, replication-dependent, replication-coupled or \"bulk\" H3 histones are a major class of H3 histones in animals with high sequence similarity across all animal species. Histone genes encodig these proteins have several particular features. 
1) These genes lack introns and are found in multiple similar copies clustered along the genome togerther with other core histone genes (H4, H3, H2B, and optionally H1). The exact organisation may vary from tandemly repeated quintets of H3, H4, H2A, H2B, H1 genes transcribed from the same strand to non-tandem jumbled arrays of genes transcribed from divergent promoters [pontarotti_long-term_2009]. 2) These genes are mainly expressed during S-phase of the cell cycle in a coordinated fashion (hence the name \"replication dendent\") and produce mRNAs that are not polyadenylated but rather end in a conserved stem-loop, which is further bound by the stem-loop binding protein (SLBP). mRNAs are rapidly degraded after the S-phase. 3) These genes are present in a specialized nuclear domain, the histone locus body (HLB), which concetrates factors for histone mRNA transcription and processing (in humans these include NPAT, U7 snRNP, FLASH) [marzluff_birth_2017].", - "taxonomy": "Animals (Metazoa)", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -2821,25 +4459,22 @@ "structure": "null", "interactions": "null", "disease": "null", - "caveats": "1) Clustered histones may still exhibit some level of sequence variation between the multiple gene copies in certain species. Although for cH3 this variation is very limited (only two isoforms in humans: H3.1 and H3.2. 2) In C. elegans an alternative mechanism of mRNA 3'-end processing evolved resulting in loss of HLB and histone clusters [marzluff_birth_2017, pontarotti_long-term_2009]." 
+ "caveats": "null" }, - "taxonomic_span": "Metazoa", - "taxonomic_span_id": "33208", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], - "publications": [ - "pontarotti_long-term_2009", - "marzluff_birth_2017" - ] + "publications": [] }, - "cH3_(Vertebrata)": { + "H3.6_(Mammals?)?": { "level": "variant_group", "description": { - "summary": "cH3_(Vertebrata) -- clustered H3 histones in vertebrates, often called canonical, replication-dependent, replication-coupled or \"bulk\" H3 histones. This is a subclass of cH3_(Animals) (see it for a detailed description).", - "taxonomy": "Vertebrates (Vertebrata)", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -2849,20 +4484,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Vertebrata", - "taxonomic_span_id": "7742", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], "publications": [] }, - "cH3_(Mammalia)": { + "H3.7_(Mammals?)?": { "level": "variant_group", "description": { - "summary": "cH3_(Mammalia) -- clustered H3 histones in mammals, often called canonical, replication-dependent, replication-coupled or \"bulk\" H3 histones. This is a subclass of cH3_(Vertebrata) and cH3_(Animals) (see it for a detailed description). 
Mammalian cH3s have the primary cH3.2 isoform and a mammal-specific cH3.1 paralog [talbert_histone_2021].", - "taxonomy": "Vertebrates (Vertebrata)", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -2872,22 +4507,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Mammalia", - "taxonomic_span_id": "40674", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], - "publications": [ - "talbert_histone_2021" - ] + "publications": [] }, - "cH3.1_(Mammalia)": { + "H3.8_(Mammals?)?": { "level": "variant_group", "description": { - "summary": "cH3.1_(Mammalia) -- a mamal specific subvariant of cH3 histone in mammals. Mammalian cH3s have the primary cH3.2 isoform and a mammal-specific cH3.1 paralog [talbert_histone_2021]. cH3.2 is the most common replicative histone in eukaryotes, cH3.1 differs from it by only one residue at position 96 [ray-gallet_histone_2021].", - "taxonomy": "Mammals (Mammalia)", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -2897,23 +4530,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Mammalia", - "taxonomic_span_id": "40674", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], - "publications": [ - "talbert_histone_2021", - "ray-gallet_histone_2021" - ] + "publications": [] }, - "cH3.1_(Homo_sapiens)": { - "level": "variant", + "H3.B_(Giardia?)": { + "level": "variant_group", "description": { - "summary": "cH3.1_(Homo_sapiens) -- a mammal-specific cH3.1 paralog of canonical H3 histone in human encoded by the following 10 genes on chromosome 6: H3C1-H3C4, H3C6-H3C8, H3C10-H3C12. 
cH3.2 is the most common replicative histone in eukaryotes, cH3.1 differs from it by only one residue at position 96 [ray-gallet_histone_2021].", - "taxonomy": "Homo sapiens", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -2923,22 +4553,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "Giardia", + "taxonomic_span_id": "5740", "alternate_names": [], - "publications": [ - "ray-gallet_histone_2021" - ] + "publications": [] }, - "cH3.2_(Mammalia)": { + "H3.P_(Moneuplotes?)": { "level": "variant_group", "description": { - "summary": "cH3.2_(Mammalia) -- is a subvariant of cH3 histone in mammals, which corresponds to the most common replicative histone in eukaryotes, cH3.2 differs from cH3.2 by only one residue at position 96 [ray-gallet_histone_2021].", - "taxonomy": "Mammals (Mammalia)", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -2948,22 +4576,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Mammalia", - "taxonomic_span_id": "40674", + "taxonomic_span": "Moneuplotes", + "taxonomic_span_id": "152459", "alternate_names": [], - "publications": [ - "ray-gallet_histone_2021" - ] + "publications": [] }, - "cH3.2_(Homo_sapiens)": { - "level": "variant", + "H3.V_(Trypanosomes?)": { + "level": "variant_group", "description": { - "summary": "cH3.2_(Homo_sapiens) -- cH3.2 cH3 histone isoform in human, encoded by the following 3 genes on chromosome 1: H3C13, H3C14, H3C15. 
cH3.2 is the most common replicative histone in eukaryotes, cH3.1 differs from it by only one residue at position 96 [ray-gallet_histone_2021].", - "taxonomy": "Homo sapiens", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -2973,22 +4599,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Homo sapiens", - "taxonomic_span_id": "9606", + "taxonomic_span": "Trypanosomes", + "taxonomic_span_id": "93954", "alternate_names": [], - "publications": [ - "ray-gallet_histone_2021" - ] + "publications": [] }, - "cH3_(Plants)": { - "level": "variant_group", + "H3.X_(Homo_sapiens)": { + "level": "variant", "description": { - "summary": "cH3_(Plants) -- canonical H3 histones of green plants (Viridiplantae), which include green algae and land plants. This is a loosely defined group of replication-dependent H3 histones in plants together with similar sequences that might have further diversified towards replication-independent tissue-specific expression but have not yet been extensively studied. Currenly not much is known about the functional specialization of various cH3s isoforms in plants [alvarez-venegas_canonical_2019]. The canonical histone H3 or cH3.1 from higher plants is remarkably similar to that of animals, fungi, and even lower eukaryotes. A sequence comparison indicates that only four amino acid substitutions, F41Y, K53R, A90M, and A96C, differentiate the canonical histone H3 from plants and mammals. Interestingly, the five HTR genes from Arabidopsis encoding histone H3.1 do not contain introns and are expressed in tissues containing highly dividing cells and all but one are expressed during the S-phase of the cell cycle. 
In a similar way, the seven genes encoding H3.1 from rice also lack introns and several of them are expressed in highly dividing tissues [alvarez-venegas_canonical_2019]. Organisation of canonical histones in green plants is variable. In land plants unlike clustered/canonical histones of animals (see cH3_(Metazoa)) replication dependent histone mRNAs are polyadenilated and genes are interspersed throught the genome. In chlorophyte green algae, such as Chlamydomonas, genes are grouped in clusteres and mRNAs end in 3'-stem loop similar to those of histone genes in animals [marzluff_metabolism_2008, alvarez-venegas_canonical_2019]. ", - "taxonomy": "Viridiplantae (Plants)", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -2998,24 +4622,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Viridiplantae", - "taxonomic_span_id": "33090", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], - "publications": [ - "alvarez-venegas_canonical_2019", - "marzluff_metabolism_2008", - " alvarez-venegas_canonical_2019" - ] + "publications": [] }, - "cH3_(Embryophyta)": { - "level": "variant_group", + "H3.X_(Primates?)": { + "level": "variant", "description": { - "summary": "cH3_(Embryophyta) -- canonical replication-dependent H3 histones of land plants and similar replication-independent histones. In land plants unlike clustered/canonical histones of animals (see cH3_(Metazoa)) replication dependent histone mRNAs are polyadenilated and genes are interspersed throught the genome. 
[marzluff_metabolism_2008, alvarez-venegas_canonical_2019]", - "taxonomy": "Embryophyta", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -3025,23 +4645,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Embryophyta", - "taxonomic_span_id": "3193", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], - "publications": [ - "marzluff_metabolism_2008", - " alvarez-venegas_canonical_2019" - ] + "publications": [] }, - "cH3_(Chlorophyta)": { - "level": "variant_group", + "H3.Y_(Homo_sapiens)": { + "level": "variant", "description": { - "summary": "cH3_(Chlorophyta) -- canonical replication-dependent H3 histones of green algae and similar replication-independent histones. In chlorophyte green algae, such as Chlamydomonas, genes are grouped in clusteres and mRNAs end in 3'-stem loop similar to those of histone genes in animals [marzluff_metabolism_2008, alvarez-venegas_canonical_2019]", - "taxonomy": "Chlorophyta", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -3051,23 +4668,51 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Chlorophyta", - "taxonomic_span_id": "3041", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], + "publications": [] + }, + "H3.Y_(Primates?)": { + "level": "variant", + "description": { + "summary": "H3.Y is involved in memory formation due to its presence in neurons in human hippocampus. 
One splice isoform has an extended C-terminal alpha tail that may interact with the H2A.Z acidic patch", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Primates", + "taxonomic_span_id": "9443", + "alternate_names": [ + { + "name": "H3.X", + "gene": "2" + } + ], "publications": [ - "marzluff_metabolism_2008", - " alvarez-venegas_canonical_2019" + "20819935", + "22650316" ] }, - "cH3_(Fungi)": { - "level": "variant_group", + "H3_(Lilly???)": { + "level": "variant", "description": { - "summary": "cH3_(Fungi) -- canonical replication-dependent H3 histones in fungi, excluding ascomycetes which have lost this gene class. In Ascomycetes such as Saccharomyces cerevisiae, only H3.3 gene is present. Comparison with the basally branching Basidiomycetes, which have both H3 and H3.3, led Malik et al. 
to the conclusion that only the H3.3 version has been retained in Ascomycetes, presumably because H3.3 can deposit both during and after replication, whereas H3 cannot [malik_phylogenomics_2003].", - "taxonomy": "Fungi", + "summary": "null", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -3077,22 +4722,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Fungi", - "taxonomic_span_id": "4751", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], - "publications": [ - "malik_phylogenomics_2003" - ] + "publications": [] }, - "cH3_(Protists)": { - "level": "variant_group", + "H4": { + "level": "type", "description": { - "summary": "cH3_(Protists) -- canonical replication-dependent H3 histones in various protists.", - "taxonomy": "Protists", + "summary": "H4 is one of the core histones. Two H4s and two H3s form H3-H4 tetramer via \"hand shake\" and \"four helix bundle\" motifs. Two H2A-H2B dimers then associate with H3-H4 tetramer to form complete nucleosome core. H4 is the most conservative histone type and has very few known variants. Structure of H4 has a histone fold domain and a flexible N-terminal tail. H4 provides sites for H2B interaction via \"four-helix bundle\" and forms a small \u03b2-sheet with H2Aa.", + "taxonomy": "null", "genes": "null", "evolution": "null", - "expression": "Recent evidence suggests that the specialized stem-loop forming 3-prime-end of replication-dependent histone mRNAs originated early in the evolution of eukaryotes but was completely lost in several lineages, including plants, fungi and most protozoa. 
Instead, these species synthesize histones from cell-cycle-regulated polyadenylated mRNAs, and regulation is primarily at the level of transcription [marzluff_metabolism_2008].", - "knock-out:": "null", + "expression": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -3102,20 +4745,20 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "SAR,Metamonada,Discoba,Amoebozoa", - "taxonomic_span_id": "2698737,2611341,2611352,554915", + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], "publications": [] }, - "H3.3": { + "late_H2B_(Echinoidea)": { "level": "variant_group", "description": { - "summary": "H3.3 -- is a diverse functional class comprising replication-independent (also called replacement) variants of the H3 histone. It seems that a distinction between H3 and H3.3 types has arisen numerous times in evolution. Four such instances are at least evident in ciliates, apicomplexans, animals and plants [malik_phylogenomics_2003]. H3.3 are characterized by changes at four positions with respect to cH3s, one in the N-terminal tail and three in the alpha-2-helix of the histone fold domain. Strictly speaking, this is not convergent evolution because the H3.3 versions do not all have the same amino acid residues in these four positions. However, it strongly suggests that a similar constraint has led to these repeated origins of distinguishable H3 and H3.3 types [malik_phylogenomics_2003]. Although, given the likelihood of independent divergences, H3.3 variants from different taxonomic clades may be neither more nor less orthologous to animal H3.3 than their cH3 ounterparts [talbert_unified_2012]. Replication-independent and replication-coupled H3 variants within an organism typically differ in residue 31 (and whether it can be phosphorylated) as well as residues 86?? 
and 89, but distinguishing residues vary in different organisms and caution is advised in designating H3.3 in less wellstudied eukaryotic kingdoms [talbert_unified_2012].", - "taxonomy": "Eukaryotes", + "summary": "late_H2B_(Echinoidea) is a histone variant class of late H2B histones characterized so far in sea urchins. Four classes of histones in sea urchins have been characterized. Three sets of histone variants are coexisting in the embryo at larval stages of sea urchin\u2019s development: the maternally inherited cleavage stage variants (CS) expressed during the two initial cleavage divisions, the early histone variants, which are recruited into embryonic chromatin from middle cleavage stages until hatching and the late variants, that are fundamentally expressed from blastula stage onward [oliver_conservative_2003]. The fourth class of histones in sea urchins are the sperm histones [mandl_five_1997]. Early, late, and sperm histone genes lack introns, contain the conserved 3-prime terminal stem-loop structure instead of a poly(A) addition site, and thus show the classical hallmarks of replication-dependent histone genes. The repetitive early histone genes are transcriptionally activated upon meiotic maturation of the egg, are maximally expressed in the rapidly dividing blastula embryo, and are already silenced at the hatching blastula stage, when the transcripts of late histone genes start to accumulate [mandl_five_1997]. Late genes are active from the late blastula stage onward [maxson_evolution_1987].", + "taxonomy": "Echinoidea (sea urchins)", "genes": "null", - "evolution": "According to Malik et al. no eukaryotic genome that has been characterized with only canonical H3 and not H3.3. Although there is little doubt regarding multiple origins of H3.3, it is certainly conceivable that ancestrally, an H3.3 was present in a small, predominantly transcriptionally active genome. 
The rapid expansion of eukaryotic genomes, large portions of which became silent in differentiated cells, may have selected for H3 and its expansion, both for increasing bulk packaging duties and to ensure transcriptional silencing where appropriate. In this regard, it is important to note that even in the archaeon M. fervidus, this division of labor is evident between HMfA and HMfB5 [malik_phylogenomics_2003].", + "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -3125,52 +4768,86 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Eukaryotes", - "taxonomic_span_id": "2759", + "taxonomic_span": "Echinoidea", + "taxonomic_span_id": "7625", "alternate_names": [], "publications": [ - "malik_phylogenomics_2003", - "talbert_unified_2012" + "mandl_five_1997", + "maxson_evolution_1987", + "oliver_conservative_2003" ] }, - "H3.3_(Animals)": { + "macroH2A": { "level": "variant_group", "description": { - "summary": "H3.3_(Animals) -- is a class of replication-independent (also called replacement) variants of the H3 histone in animals. H3.3 is characterized by changes at four positions with respect to cH3s, one in the N-terminal tail and three in the alpha-2-helix of the histone fold domain (positions 31,86,89,90). The sequence differences within the alpha-2-helix alow H3.3 to interact specifically with its own chaperones (HIRA, ATRX, DAXX). At position 31 H3.3s instead of alanine have serine or threonine which can be phosphorilated. There are multiple studies showing that phosphorylation of this site is functionally important [talbert_unified_2012]. Particularly, H3.3S31ph is associated with H3.3K27 acetylation which helps gene activation and was shown to be essential for gastrulation in Xenopus [sitbon_histone_2020]. 
The metazoan histone H3.3 has been most closely associated with active transcription, replacing cH3s at active genes and promoters, implicated in diverse biological processes, including development, transcriptional memory and transcriptional reprogramming. However, genetic studies highlighted also its imortance in maintaining heterochromatin at telomeres, centromeres, and pericentromeric regions [jang_histone_2015], as well as revealed essential functions of H3.3 in the germline and early embryonic development [elsaesser_new_2010,yuen_histone_2014,jang_histone_2015].", - "taxonomy": "Animals (Metazoa)", - "genes": "In human H3.3 is encoded by H3-3A and H3-3B genes (formerly, H3F3A and H3F3B), located in chromosome 1 (1q42.12) and 17 (17q25), respectively. In mouse by H3f3a and H3f3b genes. Genes have introns.", + "summary": "macroH2A is the largest replication-independent H2A histone variant characterized by an additional non-histone ~30 kDa macro domain connected to the C-terminus of the histone fold via an unstructured linker. MacroH2A is conserved and widespread in vertebrates, but also found in invertebrates. MacroH2A is involved in heterochromatin formation, X-inactivation and transcriptional regulation. MacroH2A is broadly distributed across the genome, is found at H3K27me3-decorated facultative heterochromatin and constitutive heterochromatin regions, and is incorporated at sites of DNA damage. Macro domains may be capable of binding NAD+ derived metabolites, such as ADP-ribose and poly-ADP-ribose. Mammals have two macroH2A genes (macroH2A.1 and macroH2A.2 in humans) [sun_histone_2019].", + "taxonomy": "null", + "genes": "null", "evolution": "null", - "expression": "H3.3 mRNAs are polyadenilated. Expressed independent of DNA synthesis through the cell cycle.", - "knock-out:": "In mice complete depletion of H3.3 leads to developmental retardation and early embryonic lethality. At the cellular level, H3.3 loss triggers cell cycle suppression and cell death. 
Surprisingly, H3.3 depletion does not dramatically disrupt gene regulation in the developing embryo. Instead, H3.3 depletion causes dysfunction of heterochromatin structures at telomeres, centromeres, and pericentromeric regions of chromosomes, leading to mitotic defects [jang_histone_2015]. In C. elegans Despite these specific expression patterns, we find that neither loss of individual H3.3 homologs nor the knockout of all five H3.3-coding genes causes sterility or lethality. However, we demonstrate an essential role for the conserved histone chaperone HIRA in the nucleosomal loading of all H3.3 variants. This requirement can be bypassed by mutation of the H3.3-specific residues to those found in H3. While even removal of all H3.3 homologs does not result in lethality, it leads to reduced fertility and viability in response to high-temperature stress [delaney_differential_2018]. Flies that lack both H3.3 genes have reduced viability and individuals that survive to adulthood are completely sterile in both sexes [sakai_transcriptional_2009]. Targeted disruption of one gene (H3f3b) results in a number of phenotypic abnormalities, including a reduction in H3.3 histone levels, leading to male infertility, as well as abnormal sperm and testes morphology. Additionally, null germ cell populations at specific stages in spermatogenesis, in particular spermatocytes and spermatogonia, exhibited increased rates of apoptosis. Disruption of H3f3b also altered histone post-translational modifications and gene expression in the testes, with the most prominent changes occurring at genes involved in spermatogenesis. 
Finally, H3f3b null testes also exhibited abnormal germ cell chromatin reorganization and reduced protamine incorporation [yuen_histone_2014].", - "function": "H3.3 has been implicated in a variety of biological processes: it is important for embryonic stem cell differentiation, epigenetic reprogramming following somatic cell nuclear transfer, neuron plasticity, the DNA damage response and centromere maintenance. H3.3 is also essential for germ line development in mammals, where it is required for the remodeling of both maternal and paternal gametes [delaney_differential_2018]. Its role in histone replacement at active genes and promoters is highly conserved and has been proposed to participate in the epigenetic transmission of active chromatin states [szenker_double_2011]. Its accumulation at silent loci in pericentric heterochromatin and telomeres, raising questions concerning the actual function of H3.3", + "expression": "null", + "knock-out": "null", + "function": "null", "sequence": "null", "localization": "null", - "deposition": "In humans and other animals specialized chaperone HIRA places H3.3 at sites of histone turnover where it replaces canonical H3s. Such sites include active genes, promoters, enhancers, transcription termination sites. Chaperones ATRX and DAXX deposit H3.3 in telomeres, imprinted genes and other heterochromatic loci, where it is modified with the trimethlyated lysine 9 heterochromatic mark (denoted H3K9me3) to maintain heterochromatin at these locations [talbert_histone_2021]. While the majority of nucleosomes are replaced by protamines during mammalian spermatogenesis, some H3.3 nucleosomes are retained and may transmit epigenetic information to the zygote [delaney_differential_2018]. In embryonic stem cells for example, HIRA chaperones H3.3 to both active and repressed genes, including also bivalent promoters normally repressed in embryonic stem cells. 
This highlights a role of HIRA in establishing chromatin landscapes not always related to active chromatin but key to allow proper differentiation [otero_histone_2014].", + "deposition": "null", "structure": "null", "interactions": "null", - "disease": "Mutations in histone genes can affect sites of PTMs causing changes in local and global DNA methylation status. These effects are directly linked to neoplastic transformation by altered gene expression. Recurrent H3.3 histone mutations are increasingly identified in several malignancies and developmental disorders in human [kumar_genes_2021]. Well characterized oncomutations in H3.3 genes include K27M, G34W/L in pediatric high-grade gliomas and K36M and G34V/R in bone tumors [xiong_histone_2016]. Competing models have suggested that H3K27M oncohistones sequester or poison PRC2 complex which deposits H3K27me3 marks. However, Sarthy et al. demonstrated that the K27M epitope only inhibits H3K27 trimethylation on chromatin in vivo, supporting the idea that these oncohistones inhibit chromatin-bound PRC2 complexes. A possible mechanism comes from recent reports [lee_automethylation_2019,wang_regulation_2019] showing that EZH2 (key component of PRC2) methylates itself, and that this automethylation is required for full catalytic activity. 
These studies also showed that H3K27M blocks EZH2 automethylation, and might contribute to the dominant effect of H3K27M mutations [sarthy_histone_2020].", + "disease": "null", "caveats": "null" }, "taxonomic_span": "Metazoa", "taxonomic_span_id": "33208", - "alternate_names": [], + "alternate_names": [ + { + "name": "mH2A" + }, + { + "name": "macroH2A1", + "gene": "1" + }, + { + "name": "macroH2A2", + "gene": "2" + }, + { + "name": "macroH2A1.1", + "gene": "1", + "splice": "1" + }, + { + "name": "macroH2A1.2", + "gene": "1", + "splice": "2" + }, + { + "name": "macroH2A2.1", + "gene": "2", + "splice": "1" + }, + { + "name": "macroH2A2.2", + "gene": "2", + "splice": "2" + } + ], "publications": [ - "talbert_unified_2012", - "sitbon_histone_2020", - "jang_histone_2015", - "elsaesser_new_2010", - "yuen_histone_2014" + "16107708", + "16803903", + "20543561", + "22650316", + "25731851", + "sun_histone_2019" ] }, - "H3.3_(Homo_sapiens)": { + "macroH2A.1.s1_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "H3.3_(Homo_sapiens) -- is a class of replication-independent (also called replacement) variants of the H3 histone in human encoded by H3-3A and H3-3B genes. Both genes code for an identical protein. See H3.3_(Animals) for details description of this variant.", - "taxonomy": "Homo sapiens", + "summary": "macroH2A.1.s1_(Homo_sapiens) is a splice isoform encoded by macroH2A.1 gene in humans. 
The macro domain of macroH2A.1.s1 isoform is capable of binding NAD+ derived metabolites, such as ADP-ribose and poly-ADP-ribose, while other isoforms (including those produced by macroH2A.2 gene homologs) do not have this ability [sun_histone_2019].", + "taxonomy": "null", "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -3183,46 +4860,44 @@ "taxonomic_span": "Homo sapiens", "taxonomic_span_id": "9606", "alternate_names": [], - "publications": [] + "publications": [ + "sun_histone_2019" + ] }, - "H3.3_(Plants)": { - "level": "variant_group", + "macroH2A.1.s1_(Mammalia)": { + "level": "variant", "description": { - "summary": "H3.3_(Plants) -- is a class of replication-independent (also called replacement) variants of the H3 histone in green plants (Viridiplantae), which include green algae and land plants. Despite having the same name as H3.3 of animals, similar functions and key amino acids differences with repective canonical H3s, plant H3.3 has evolved independently. However, this strongly suggests that a similar constraint has led to these repeated origins of distinguishable H3 and H3.3 types [malik_phylogenomics_2003]. H3.3 in plants is characterized by changes at four positions with respect to cH3s, two in the N-terminal tail and two in the alpha-2-helix of the histone fold domain (positions 31, 41, 87, 90, compare with positions 31,87,89,90 in animals). At position 31 H3.3s in plants instead of alanine usially have threonine which can be phosphorilated [talbert_unified_2012]. H3.3 is likely involved in transcriptional regulation, is enriched in the body of actively transcribed genes, promoters and downstream of transcription termination sites in some genes [alvarez-venegas_canonical_2019]. Certain mechanisms of H3.3 action have been reported. Jacob et al. 
have shown that SET domain of the histone H3 lysine-27 (H3K27) methyltransferase ATXR5 have a bipartite catalytic domain that specifically reads alanine-31 of H3.1. Thus variation at position 31 between H3.1 and replication-independent H3.3 is responsible for inhibiting the activity of ATXR5 and its paralog, ATXR6 [jacob_selective_2014]. Wollmann et al. proposed that H3.3 prevents recruitment of H1, inhibiting H1\u2019s promotion of chromatin folding that restricts access to DNA methyltransferases responsible for gene body methylation. Thus, gene body methylation is likely shaped by H3.3 dynamics in conjunction with transcriptional activity [wollmann_histone_2017].", - "taxonomy": "Green plants (Viridiplantae)", - "genes": "In contrast to intronless cH3s, H3.3 in plants have introns. In Arabidopsis H3.3 is represented by HTR4, HTR5, and HTR8 genes [alvarez-venegas_canonical_2019].", + "summary": "macroH2A.1.s1_(Mammalia) is a splice isoform encoded by one of the macroH2A genes in mammals (corresponds to the macroH2A.1 gene in humans). The macro domain of macroH2A.1.s1 isoform is capable of binding NAD+ derived metabolites, such as ADP-ribose and poly-ADP-ribose, while other isoforms (including those produced by macroH2A.2 gene homologs) do not have this ability [sun_histone_2019].", + "taxonomy": "null", + "genes": "null", "evolution": "null", - "expression": "In Arabidopsis, H3.3 genes do not show replication-dependent expression and are rather expressed throughout the cell cycle. 
In addition, expression of Arabidopsis genes encoding histone H3.3 occurs not only in young, undifferentiated, but also in mature tissues suggesting that the expression of these genes continues after cell division ceases [alvarez-venegas_canonical_2019].", - "knock-out:": "In Arabidopsis, removal of three H3.3 genes (HTR4, HTR5,and HTR8) causes defects in male gametogenesis and results in embryonic lethality [wollmann_histone_2017].", + "expression": "null", + "knock-out": "null", "function": "null", - "sequence": "Characteristic changes between cH3 and H3.3 in plants are A31T, F41Y, S87H, and A90L [alvarez-venegas_canonical_2019].", + "sequence": "null", "localization": "null", - "deposition": "Similar to animals, plants have a specialized chaperone HIRA that places H3.3 at sites of histone turnover where it replaces canonical H3s [otero_histone_2014] Such sites include active genes, promoters, enhancers, transcription termination sites. In animals chaperones ATRX and DAXX deposit H3.3 in telomeres, imprinted genes and other heterochromatic loci [talbert_histone_2021]. A DAXX homolog has not been found in plants so far, but there is 1 gene coding for a homolog of ATRX. There are also several genes distantly related to animal DEK, which was shown to have histone chaperone activity. 
The structural and functional characterization of these chaperones in plants awaits future studies [otero_histone_2014].", + "deposition": "null", "structure": "null", "interactions": "null", "disease": "null", "caveats": "null" }, - "taxonomic_span": "Viridiplantae", - "taxonomic_span_id": "33090", + "taxonomic_span": "Mammalia", + "taxonomic_span_id": "40674", "alternate_names": [], "publications": [ - "malik_phylogenomics_2003", - "talbert_unified_2012", - "alvarez-venegas_canonical_2019", - "jacob_selective_2014", - "wollmann_histone_2017" + "sun_histone_2019" ] }, - "H3.3_(Fungi)": { - "level": "variant_group", + "macroH2A.1.s2_(Homo_sapiens)": { + "level": "variant", "description": { - "summary": "H3.3_(Fungi) -- is a class of H3 histone variants in Fungi which share similarity to H3.3 in other kingdoms (characteristic amino acids at the four key positions). It is, however, the main form of histone H3 in Ascomycetes, where canonical H3 was lost during evolution [malik_phylogenomics_2003]. While H3.3 in Ascomycetes is the only form of H3 histone it is mainly reffered to as H3 rather than H3.3. In the current classification we will refer to such histones as H3.3_(Ascomycota) to retain its proper placement within our classification. Basidiomycetes have both canonical H3 and H3.3 histones. Fungi H3.3 along with plant and animal H3.3s have evolved independently, but share similar sequence difference with respective canonical H3s. It is likely that they have evolved under similar contraints. Since H3.3 as a separate variant is available only in Basidiomycetes the H3.3/cH3 functional difference in Fungi remains poorly studied. Anju et al. have charaterized two H3 genes in basidiomycete Ustilago maydis U1 and U2. 
The U1 gene was shown to posses replication-independent expression and sequence characteristic of H3.3 replacement histones, while U2 gene manifested replication-coupled expression typical for canonical H3 [anju_identification_2011].", - "taxonomy": "Fungi", - "genes": "In S. cerevisiae H3 histone is encoded by HHT1 and HHT2 genes. U1 gene in Ustilago maydis.", + "summary": "macroH2A.1.s2_(Homo_sapiens) is a splice isoform encoded by macroH2A.1 gene in humans. The macro domain of macroH2A.1.s2 isoform is not capable of binding NAD+ derived metabolites, such as ADP-ribose and poly-ADP-ribose [sun_histone_2019].", + "taxonomy": "null", + "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -3232,23 +4907,22 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Fungi", - "taxonomic_span_id": "4751", + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", "alternate_names": [], "publications": [ - "malik_phylogenomics_2003", - "anju_identification_2011" + "sun_histone_2019" ] }, - "H3.3_(Ascomycota)": { - "level": "variant_group", + "macroH2A.1.s2_(Mammalia)": { + "level": "variant", "description": { - "summary": "H3.3_(Ascomycota) -- is the main form of H3 histone in Ascomycetes.", - "taxonomy": "Fungi", - "genes": "In S. cerevisiae H3 histone is encoded by HHT1 and HHT2 genes", + "summary": "macroH2A.1.s2_(Mammalia) is a splice isoform encoded by one of the macroH2A genes in mammals (corresponds to macroH2A.1 gene in humans). 
The macro domain of macroH2A.1.s2 isoform is not capable of binding NAD+ derived metabolites, such as ADP-ribose and poly-ADP-ribose [sun_histone_2019].", + "taxonomy": "null", + "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -3258,20 +4932,22 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "Ascomycota", - "taxonomic_span_id": "4890", + "taxonomic_span": "Mammalia", + "taxonomic_span_id": "40674", "alternate_names": [], - "publications": [] + "publications": [ + "sun_histone_2019" + ] }, - "H3.3_(Protists)": { - "level": "variant_group", + "macroH2A.1_(Mammalia)": { + "level": "variant", "description": { - "summary": "H3.3_(Protists) -- is a class of H3.3-like replication-independent (also called replacement) variants of the H3 histone in Protists. hv2 H3 histone variant in Tetrahymena thermophila is among the few from this group that have been characterized [yu_constitutive_1997]. Sequence analysis suggests that other protists such as Porphyra, Thalassiosira, Dictyostelium have H3 histones with characteristic differences at positions 31 and 85-89, which may suggest the presence of H3.3-like histones in their genomes [talbert_unified_2012].", - "taxonomy": "Fungi", - "genes": "HHT3 Tetrahymena thermophila", + "summary": "macroH2A.1_(Mammalia) is a protein encoded by one of the macroH2A genes in mammals (corresponds to macroH2A.1 gene in humans). This gene further produces two splice variants macroH2A.1.s1 and macroH2A.1.s2 by inclusion of mutually exclusive exons encoding a region within the macro domain. 
The macro domain of macroH2A.1.s1 isoform is capable of binding NAD+ derived metabolites, such as ADP-ribose and poly-ADP-ribose, while other isoforms (including those produced by macroH2A.2 gene homologs) do not have this ability [sun_histone_2019].", + "taxonomy": "null", + "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "null", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", @@ -3281,311 +4957,216 @@ "disease": "null", "caveats": "null" }, - "taxonomic_span": "SAR,Metamonada,Discoba,Amoebozoa", - "taxonomic_span_id": "2698737,2611341,2611352,554915", - "alternate_names": [ - { - "name": "hv2" - } - ], + "taxonomic_span": "Mammalia", + "taxonomic_span_id": "40674", + "alternate_names": [], "publications": [ - "yu_constitutive_1997", - "talbert_unified_2012" + "sun_histone_2019" ] }, - "H3.4_(Mammalia)": { + "macroH2A.2_(Homo_sapiens)": { "level": "variant", "description": { - "summary": "H3.4_(Mammalia) -- is a mammal-specific H3 histone variant highly expressed in testis and at lower level in other tissues [kycia_tudor_2014]. This variant is also reffered to as H3.1t, H3T, or TS H3.4. The H3.4 variant is very similar to canonical H3 histones both in sequence, gene location and transcriptional regulation. In human H3.4 has only 4 amino acid difference from cH3s (A23V,V71M, A98S, A111V), its gene is located within histone gene cluster, is intronless, its mRNA has a stem-loop structure. H3.4 expression is replication-dependent [ueda_testis-specific_2017]. Mouse H3.4 was shown to be essential for very early stages of spermatogenesis, its deficiency leads to azoospermia because of the loss of haploid germ cells. When differentiating spermatogonia emerge in normal spermatogenesis, H3.4 appears and replaces the canonical H3 proteins [ueda_testis-specific_2017]. 
Structural studies have revealed that H3.4 containing nucleosome are less stable, particularly due to V71M and A111V substitutions [tachiwana_structural_2010]. Tachiwana et al. have found that H3.4/H4 is not efficiently incorporated into the nucleosome by human Nap1 chaperone, due to its defective H3.4/H4 deposition on DNA. In contrast, human Nap2 chaperone, a paralog of Nap1, promoted nucleosome assembly with H3.4/H4. Mutational analyses revealed that the A111V mutation in H3.4 is essential for this difference [tachiwana_nucleosome_2008]. It was demostrated that A23V mutation favors the interaction of trymethyllysine-binding Tudor domains of PHF1 and PHF2 proteins (critical components of the PCR2 complex) with H3K27me3 marks. PHF1 co-localizes with H3.4 in testis and its Tudor domain preferentially binds to H3.4K27me3 over canonical H3K27me3 in vitro, implicating that H3.4K27me3 might be a physiological ligand of PHF1/19. [dong_structural_2020, kycia_tudor_2014].", - "taxonomy": "Mammals", - "genes": "In human is encoded by H3-4 gene (formerly HIST3H3, also an alias name H3C16 has been suggested (Seal et al.)), in mouse by H3f4 gene. The gene encodes mRNA with a stem loop structure. In human the gene is located on chromosome 1 adjacent to genes H2AC25 and H2BC26 in a small histone gene cluster.", + "summary": "macroH2A.2_(Homo_sapiens) is a protein encoded by macroH2A.2 gene in humans. The macro domain of macroH2A.2 variant is not capable of binding NAD+ derived metabolites [sun_histone_2019].", + "taxonomy": "null", + "genes": "null", "evolution": "null", "expression": "null", - "knock-out:": "Knockout mice for H3.4 were first generated in 2017; both male and female H3t null mice were viable and healthy, but the male mice were sterile. 
H3.4 deficiency leads to azoospermia because of the loss of haploid germ cells[ueda_testis-specific_2017].", + "knock-out": "null", "function": "null", "sequence": "null", "localization": "null", "deposition": "null", - "structure": "PDB structure of human H3.4 containing nucleosome is available with id 3A6N [tachiwana_structural_2010].", + "structure": "null", "interactions": "null", - "disease": "The single\u2011nucleotide polymorphism c190C>T (Arg64Cys) in the human testis\u2011specific histone variant, H3.4, was studied in Japanese patients for its association with Sertoli cell\u2011only syndrome, which causes infertility [dong_structural_2020].", + "disease": "null", "caveats": "null" }, - "taxonomic_span": "Mammalia", - "taxonomic_span_id": "40674", - "alternate_names": [ - { - "name": "H3T" - } - ], - "publications": [ - "kycia_tudor_2014", - "ueda_testis-specific_2017", - "tachiwana_structural_2010", - "tachiwana_nucleosome_2008", - "dong_structural_2020", - " kycia_tudor_2014" - ] - }, - "cenH3_(Plants)": { - "level": "variant_group", - "description": "cenH3 is a centromere-specific histone variant, which replaces canonical H3 in centromeric nucleosomes. It is required for kinetochore formation, mitotic progression and chromosome segregation. cenH3 has an extended L1-loop and its N-terminal tail is very different from other H3 variants. cenH3s have an extended L1-loop and usually replace Phe84 in canonical H3 with Trp, and Thr 107 with Ala, Cys, or Ser. cenH3s ususally lack a conserved glutamine in the alpha1 helix of the histone fold. 
cenH3s typically have only about 50-60% amino acid identity to canonical H3 in the histone fold domain and no conservation of the N-terminus.", - "taxonomic_span": "Eukaryotes", - "taxonomic_span_id": "2759", - "alternate_names": [ - { - "name": "CENP-A" - }, - { - "name": "Cse4" - }, - { - "name": "HCP-3" - }, - { - "name": "CNP1" - }, - { - "name": "HTR12" - }, - { - "name": "CNA1" - }, - { - "name": "cid" - } - ], - "publications": [ - "22650316", - "19766562", - "25956076", - "23324462", - "21743476", - "14583738" - ] - }, - "H3.Y_(Primates?)": { - "level": "variant_group", - "description": "H3.Y is involved in memory formation due to its presence in neurons in human hippocampus. One splice isoform has an extended C-terminal alpha tail that may interacts with the H2A.Z acidic patch", - "taxonomic_span": "Primates", - "taxonomic_span_id": "9443", - "alternate_names": [ - { - "name": "H3.X", - "gene": 2 - } - ], - "publications": [ - "22650316", - "20819935" - ] - }, - "H3.3_(Eukarya)": { - "level": "variant_group", - "description": "The major replication-independent or replacement H3, important for development, transcription, and chromosome segregation. It typically differs from the canonical H3 by only a few amino acids that are necessary for replication-independent assembly. 
", - "taxonomic_span": "Eukaryotes", - "taxonomic_span_id": "2759", - "alternate_names": [ - { - "name": "soH3-1", - "gene": 1 - }, - { - "name": "soH3-2", - "gene": 2 - }, - { - "name": "hv2", - "gene": 1 - } - ], - "publications": [ - "22650316", - "20738881", - "19412883", - "24229707", - "14583738" - ] - }, - "TS_H3.4": { - "level": "variant_group", - "description": "Testis spesific mamal H3 variant.", - "taxonomic_span": "Mammalia", - "taxonomic_span_id": "40674", - "alternate_names": [ - { - "name": "H3.1t" - } - ], - "publications": [ - "22650316", - "8986613" - ] - }, - "H3.5_(Mammals?)": { - "level": "variant_group", - "description": "A hominid specific variant expressed in seminiferous tubules of human testis.", - "taxonomic_span": "Hominids", - "taxonomic_span_id": "9604", - "alternate_names": [], - "publications": [ - "21274551" - ] - }, - "H3.5_(Hominids?)": { - "level": "variant_group", - "description": "A hominid specific variant expressed in seminiferous tubules of human testis.", - "taxonomic_span": "Hominids", - "taxonomic_span_id": "9604", - "alternate_names": [], - "publications": [ - "21274551" - ] - }, - "H3.P_(Moneuplotes?)": { - "level": "variant_group", - "description": "null", - "taxonomic_span": "Moneuplotes", - "taxonomic_span_id": "152459", - "alternate_names": [], - "publications": [] - }, - "H3.V_(Trypanosomes?)": { - "level": "variant_group", - "description": "null", - "taxonomic_span": "Trypanosomes", - "taxonomic_span_id": "93954", - "alternate_names": [], - "publications": [] - }, - "H3.B_(Giardia?)": { - "level": "variant_group", - "description": "null", - "taxonomic_span": "Giardia", - "taxonomic_span_id": "5740", + "taxonomic_span": "Homo sapiens", + "taxonomic_span_id": "9606", "alternate_names": [], - "publications": [] - }, - "H4": { - "level": "type", - "description": "H4 is one of the core histones. Two H4s and two H3s form H3-H4 tetramer via \"hand shake\" and \"four helix bundle\" motifs. 
Two H2A-H2B dimers then associate with H3-H4 tetramer to form complete nucleosome core. H4 is the most conservative histone type and has very few known variants. Structure of H4 has a histone fold domain and a flexible N-terminal tail. H4 provides sites for H2B interaction via \"four-helix bundle\" and forms a small \u03b2-sheet with H2Aa." - }, - "cH4": { - "level": "variant_group", - "description": "Canonical histones are replication-dependent while histone variants are replication-independent, constitutively expressed during cell cycle. Genes encoding canonical histones are typically located within multigene clusters and use specific type of regulation at the RNA level with a stem loop structure instead of polyA tail", - "taxonomic_span": "Eukaryotes", - "taxonomic_span_id": "2759", - "alternate_names": [ - { - "name": "ca H4" - } - ], "publications": [ - "22650316" + "sun_histone_2019" ] }, - "H1": { - "level": "type", - "description": "H1 is the linker histone. Associates with the nucleosome core and linker DNA near the DNA entry-exit points. The resulting particle is called chromatosome. H1-histone is lysine rich, has long disordered C-terminal tail and a short N-terminal tail. The globular domain has three helices and a wing, so-called \"winged helix\" motif." - }, - "generic_H1": { - "level": "variant_group", - "description": "H1 has mainly species specific variants. In current version of HistoneDB all H1 are presented as genericH1 class, except for several interesting species specific variants which are provided as separate classes.", - "taxonomic_span": "Eukaryotes", - "taxonomic_span_id": "2759", - "alternate_names": [ - { - "name": "gen H1" - } - ], + "macroH2A.2_(Mammalia)": { + "level": "variant", + "description": { + "summary": "macroH2A.2_(Mammalia) is a protein encoded by one of the macroH2A genes in mammals (corresponds to macroH2A.2 gene in humans). 
The macro domain of macroH2A.2 variant is not capable of binding NAD+ derived metabolites [sun_histone_2019].", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Mammalia", + "taxonomic_span_id": "40674", + "alternate_names": [], "publications": [ - "22650316", - "23945933", - "10973918", - "11149891", - "26212454" + "sun_histone_2019" ] }, - "H1.0": { + "OO_H1.8": { "level": "variant_group", - "description": "H1.0 is a replication independent linker histone found in animals expressed in terminally differentiated cells. Has a common monophyletic origin that can be traced back before the differentiation between protostomes and deuterostomes, very early in metazoan evolution.", - "taxonomic_span": "Metazoa", - "taxonomic_span_id": "33208", + "description": { + "summary": "Sequences collected here belong to (OO) H1.8 - an oocyte specific variant of H1 common in mammals.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Mammalia", + "taxonomic_span_id": "40674", "alternate_names": [ { - "name": "H1\u00b0" - }, - { - "name": "H5", - "taxonomy": "aves" - }, - { - "name": "H1\u03b4" - }, - { - "name": "RI H1" + "name": "H1oo" } ], "publications": [ - "22650316", - "23945933", - "7066298", - "2898141" - ] - }, - "H1.1": { - "level": "variant_group", - "description": "H1.1 is a replication independent linker histone.", - "taxonomic_span": "Homo", - "taxonomic_span_id": "9605", - "alternate_names": [], - "publications": [ - "26689747" + 
"22650316" ] }, - "H1.2": { + "scH1": { "level": "variant_group", - "description": "H1.2 is a replication independent linker histone.", - "taxonomic_span": "Homo", - "taxonomic_span_id": "9605", + "description": { + "summary": "A special variant of H1 found in Saccharomyces and probably other yeast species that has two globular domains. Saccharomyces cerevisiae has only one gene that encodes H1 histone (HHO1).", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Saccharomyces(?)", + "taxonomic_span_id": "4930", "alternate_names": [], "publications": [ - "26689747" + "8772381" ] }, - "H1.3": { + "short_H2A": { "level": "variant_group", - "description": "H1.3 is a replication independent linker histone.", - "taxonomic_span": "Homo", - "taxonomic_span_id": "9605", - "alternate_names": [], + "description": { + "summary": "short_H2A is a class encompassing several histone H2A variants in placental (eutherian) mammals with shortened C-terminus expressed mainly during mammalian male germ cell development before the nearly complete replacement of histones by protamines in sperm nuclei. The repertoires of short histone H2A variants vary extensively among eutherian mammals due to lineage-specific gains and losses. Short H2A variants include H2A.B, H2A.L, H2A.P, H2A.Q, their genes are usually located on X chromosome and are intronless. These four clades of eutherian mammal short H2A variants emerged from a single, well-supported monophyletic clade, confirming their common ancestry [molaro_evolutionary_2018]. Due to shortened docking domain and changes within the acidic patch nucleosomes incorporating short H2As wrap less DNA (120-130 bp) and form loosely packed chromatin. 
There are few conserved residues in the histone fold domain of sH2As that distinguish them from each other, instead much of their specialization may stem from changes in the N- and C-terminal tails of these variants [molaro_evolutionary_2018]. Aberrant short H2A upregulation was reported in a broad range of cancers [chew_short_2021]. Caveats: H2A.B is also expressed in the brain [jiang_short_2020].", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Eutheria", + "taxonomic_span_id": "9347", + "alternate_names": [ + { + "name": "sH2A" + } + ], "publications": [ - "26689747" + "chew_short_2021", + "jiang_short_2020", + "molaro_evolutionary_2018" ] }, - "H1.4": { + "sperm_H2B_(Echinoidea)": { "level": "variant_group", - "description": "H1.4 is a replication independent linker histone.", - "taxonomic_span": "Homo", - "taxonomic_span_id": "9605", + "description": { + "summary": "sperm_H2B_(Echinoidea) is a histone variant class of sperm H2B histones characterized so far in sea urchins. Four classes of histones in sea urchins have been characterized. Three sets of histone variants are coexisting in the embryo at larval stages of sea urchin\u2019s development: the maternally inherited cleavage stage variants (CS) expressed during the two initial cleavage divisions, the early histone variants, which are recruited into embryonic chromatin from middle cleavage stages until hatching and the late variants, that are fundamentally expressed from blastula stage onward [oliver_conservative_2003]. The fourth class of histones in sea urchins are the sperm histones. 
They are exclusively transcribed during spermatogenesis and code for specialized H1 and H2B proteins with basic N-terminal extensions which are responsible for the unusually high chromatin condensation in mature sperm [mandl_five_1997]. In Parechinus angulosus the characterized sperm H2B sequence has a repeating pentapeptide in the N-terminal region [strickland_complete_1978].", + "taxonomy": "Echinoidea (sea urchins)", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "Echinoidea", + "taxonomic_span_id": "7625", "alternate_names": [], "publications": [ - "26689747" + "mandl_five_1997", + "oliver_conservative_2003", + "strickland_complete_1978" ] }, - "H1.5": { - "level": "variant_group", - "description": "H1.5 is a replication independent linker histone.", - "taxonomic_span": "Homo", - "taxonomic_span_id": "9605", + "TS H3.10": { + "level": "variant", + "description": { + "summary": "null", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], - "publications": [ - "26689747" - ] + "publications": [] }, "TS_H1.6": { "level": "variant_group", - "description": "Sequences collected here belong to (TS) H1.6 - a testis specific variant of H1 common in mammals.", + "description": { + "summary": "Sequences collected here belong to (TS) H1.6 - a testis specific variant of H1 common in mammals.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + 
"knock-out": "null", + 
"function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, "taxonomic_span": "Mammalia", "taxonomic_span_id": "40674", "alternate_names": [ @@ -3599,7 +5180,22 @@ }, "TS_H1.7": { "level": "variant_group", - "description": "Sequences collected here belong to (TS) H1.7 - a testis specific variant of H1 common in mammals.", + "description": { + "summary": "Sequences collected here belong to (TS) H1.7 - a testis specific variant of H1 common in mammals.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, "taxonomic_span": "Mammalia", "taxonomic_span_id": "40674", "alternate_names": [ @@ -3611,23 +5207,24 @@ "22650316" ] }, - "OO_H1.8": { - "level": "variant_group", - "description": "Sequences collected here belong to (OO) H1.8 - an oocyte specific variant of H1 common in mammals.", - "taxonomic_span": "Mammalia", - "taxonomic_span_id": "40674", - "alternate_names": [ - { - "name": "H1oo" - } - ], - "publications": [ - "22650316" - ] - }, "TS_H1.9": { "level": "variant_group", - "description": "Sequences collected here belong to (TS) H1.9 - a testis specific variant of H1 common in mammals.", + "description": { + "summary": "Sequences collected here belong to (TS) H1.9 - a testis specific variant of H1 common in mammals.", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, "taxonomic_span": "Mammalia", "taxonomic_span_id": "40674", "alternate_names": [ @@ 
-3639,29 +5236,28 @@ "22650316" ] }, - "H1.10": { - "level": "variant_group", - "description": "Sequences collected here belong to H1.10 here - a vertebrate specific H1 variant.", - "taxonomic_span": "Vertebrates", - "taxonomic_span_id": "7742", - "alternate_names": [ - { - "name": "H1x" - } - ], - "publications": [ - "22650316" - ] - }, - "scH1": { - "level": "variant_group", - "description": "A special variant of H1 found in Saccharomyces and probably other yeast species that has two globular domains. Saccharomyces cerevisiae has only one gene that encodes H1 histone (HHO1).", - "taxonomic_span": "Saccharomyces(?)", - "taxonomic_span_id": "4930", + "Viral": { + "level": "type", + "description": { + "summary": "null", + "taxonomy": "null", + "genes": "null", + "evolution": "null", + "expression": "null", + "knock-out": "null", + "function": "null", + "sequence": "null", + "localization": "null", + "deposition": "null", + "structure": "null", + "interactions": "null", + "disease": "null", + "caveats": "null" + }, + "taxonomic_span": "null", + "taxonomic_span_id": "null", "alternate_names": [], - "publications": [ - "8772381" - ] + "publications": [] } } } \ No newline at end of file