Provide a comprehensive cross-database identifier and functional mapping reference for human MYC. This should serve as a definitive lookup resource for researchers. ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 1: GENE IDENTIFIERS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Provide ALL gene-level database identifiers: - HGNC ID and approved symbol - Ensembl gene ID (ENSG) - NCBI Entrez Gene ID - OMIM gene/locus ID - Genomic location: chromosome, start position, end position, strand ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 2: TRANSCRIPT IDENTIFIERS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ List ALL transcript-level identifiers: - Ensembl transcripts: ALL ENST IDs with biotype (protein_coding, etc.) How many total transcripts? - RefSeq transcripts: ALL NM_ mRNA accessions Mark which is MANE Select (canonical clinical standard) - CCDS IDs: ALL consensus coding sequence identifiers For the CANONICAL/MANE SELECT transcript: - List ALL exon IDs (ENSE) with genomic coordinates - Total exon count ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 3: PROTEIN IDENTIFIERS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ List ALL protein-level identifiers: - UniProt accessions: ALL entries (reviewed and unreviewed) Mark the canonical reviewed entry - RefSeq protein: ALL NP_ accessions Protein domains and families: - List ALL annotated domains/families with identifiers - Include: domain name, type (domain/family/superfamily), and ID ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 4: STRUCTURE IDENTIFIERS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Experimental structures: - List ALL PDB structure IDs - For each: experimental method (X-ray, NMR, Cryo-EM) and resolution - Total PDB structure count Predicted 
structures: - AlphaFold model ID and confidence metrics (pLDDT) ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 5: CROSS-SPECIES ORTHOLOGS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ List orthologous genes in key model organisms (where available): - Mouse (Mus musculus): gene ID, symbol - Rat (Rattus norvegicus): gene ID, symbol - Zebrafish (Danio rerio): gene ID, symbol - Fruit fly (Drosophila melanogaster): gene ID, symbol - Worm (C. elegans): gene ID, symbol - Yeast (S. cerevisiae): gene ID, symbol ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 6: CLINICAL VARIANTS & AI PREDICTIONS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Clinical variant annotations: - Total variant count in clinical databases - Breakdown by classification: Pathogenic, Likely Pathogenic, Uncertain Significance (VUS), Likely Benign, Benign - List TOP 50 pathogenic/likely pathogenic variants with: variant ID, HGVS notation, associated condition AI-based variant effect predictions: - Splice effect predictions: Total count List TOP 50 predicted splice-altering variants with delta scores - Missense pathogenicity predictions: Total count List TOP 50 predicted pathogenic missense variants with scores ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 7: BIOLOGICAL PATHWAYS & GENE ONTOLOGY ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Pathway membership: - List ALL biological pathways this gene participates in - Include pathway IDs and names - Total pathway count Gene Ontology annotations: - Biological Process: count and TOP 20 terms with IDs - Molecular Function: count and TOP 20 terms with IDs - Cellular Component: count and TOP 20 terms with IDs ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 8: PROTEIN INTERACTIONS & MOLECULAR NETWORKS 
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Protein-protein interactions: - Total interaction count - List TOP 50 highest-confidence interacting proteins with scores Protein similarity (evolutionary and structural): - Structural/embedding similarity: How many similar proteins? List TOP 20 with similarity scores - Sequence homology: How many homologous proteins? List TOP 20 with identity/similarity scores ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 9: TRANSCRIPTION FACTOR REGULATORY DATA ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ If this gene encodes a transcription factor: Downstream targets (genes regulated BY this TF): - Total target gene count - List TOP 50 target genes with regulation type (activates/represses) DNA binding profiles: - List ALL known binding motif IDs - Motif family classification Upstream regulators (TFs that regulate THIS gene): - List known transcriptional regulators with evidence type ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 10: DRUG & PHARMACOLOGY DATA ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ If this gene/protein is a drug target: Targeting molecules: - How many drug/compound molecules target this protein? - List TOP 30 molecules by development phase - Include: molecule ID, name, mechanism, highest development phase Clinical trials: - How many clinical trials involve drugs targeting this gene? - List TOP 20 trials with: trial ID, phase, status, intervention Pharmacogenomics: - Known drug-gene interactions affecting drug response - Dosing guidelines if any exist ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 11: EXPRESSION PROFILES ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Tissue expression: - Which tissues express this gene most highly? 
- List TOP 30 tissues with expression scores/levels - Note any tissue-specific or tissue-enriched patterns Cell type expression: - Which cell types show highest expression? - List TOP 30 cell types with expression scores - Note any cell type-specific patterns Single-cell expression data (if available): - Which single-cell datasets/experiments include this gene? - Notable cell population patterns ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 12: DISEASE ASSOCIATIONS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Mendelian/monogenic disease links: - What diseases are caused by mutations in this gene? - List ALL associated diseases with: disease name, disease ID, inheritance pattern, evidence level Phenotype associations: - What clinical phenotypes are associated with this gene? - List TOP 50 phenotype terms with IDs Complex trait associations (GWAS): - What traits/diseases are linked via genome-wide association studies? - List TOP 30 GWAS associations with: trait, study ID, p-value, effect size if available ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ FORMATTING REQUIREMENTS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ - Present each section with clear headers - Use tables for listing multiple items - Always include COUNTS for every category - For lists with >50 items: show total count + TOP 50 - For lists with <50 items: show ALL items - Always include database identifiers (IDs), not just names - Mark canonical/primary/reviewed entries where applicable - If a section has no data available, state "No data available" rather than omitting the section

Question

Provide a comprehensive cross-database identifier and functional mapping
reference for human MYC. This should serve as a definitive
lookup resource for researchers.

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 1: GENE IDENTIFIERS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Provide ALL gene-level database identifiers:
- HGNC ID and approved symbol
- Ensembl gene ID (ENSG)
- NCBI Entrez Gene ID
- OMIM gene/locus ID
- Genomic location: chromosome, start position, end position, strand

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 2: TRANSCRIPT IDENTIFIERS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
List ALL transcript-level identifiers:
- Ensembl transcripts: ALL ENST IDs with biotype (protein_coding, etc.)
  How many total transcripts?
- RefSeq transcripts: ALL NM_ mRNA accessions
  Mark which is MANE Select (canonical clinical standard)
- CCDS IDs: ALL consensus coding sequence identifiers

For the CANONICAL/MANE SELECT transcript:
- List ALL exon IDs (ENSE) with genomic coordinates
- Total exon count

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 3: PROTEIN IDENTIFIERS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
List ALL protein-level identifiers:
- UniProt accessions: ALL entries (reviewed and unreviewed)
  Mark the canonical reviewed entry
- RefSeq protein: ALL NP_ accessions

Protein domains and families:
- List ALL annotated domains/families with identifiers
- Include: domain name, type (domain/family/superfamily), and ID

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 4: STRUCTURE IDENTIFIERS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Experimental structures:
- List ALL PDB structure IDs
- For each: experimental method (X-ray, NMR, Cryo-EM) and resolution
- Total PDB structure count

Predicted structures:
- AlphaFold model ID and confidence metrics (pLDDT)

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 5: CROSS-SPECIES ORTHOLOGS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
List orthologous genes in key model organisms (where available):
- Mouse (Mus musculus): gene ID, symbol
- Rat (Rattus norvegicus): gene ID, symbol
- Zebrafish (Danio rerio): gene ID, symbol
- Fruit fly (Drosophila melanogaster): gene ID, symbol
- Worm (C. elegans): gene ID, symbol
- Yeast (S. cerevisiae): gene ID, symbol

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 6: CLINICAL VARIANTS & AI PREDICTIONS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Clinical variant annotations:
- Total variant count in clinical databases
- Breakdown by classification: Pathogenic, Likely Pathogenic,
  Uncertain Significance (VUS), Likely Benign, Benign
- List TOP 50 pathogenic/likely pathogenic variants with:
  variant ID, HGVS notation, associated condition

AI-based variant effect predictions:
- Splice effect predictions: Total count
  List TOP 50 predicted splice-altering variants with delta scores
- Missense pathogenicity predictions: Total count
  List TOP 50 predicted pathogenic missense variants with scores

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 7: BIOLOGICAL PATHWAYS & GENE ONTOLOGY
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Pathway membership:
- List ALL biological pathways this gene participates in
- Include pathway IDs and names
- Total pathway count

Gene Ontology annotations:
- Biological Process: count and TOP 20 terms with IDs
- Molecular Function: count and TOP 20 terms with IDs
- Cellular Component: count and TOP 20 terms with IDs

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 8: PROTEIN INTERACTIONS & MOLECULAR NETWORKS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Protein-protein interactions:
- Total interaction count
- List TOP 50 highest-confidence interacting proteins with scores

Protein similarity (evolutionary and structural):
- Structural/embedding similarity: How many similar proteins?
  List TOP 20 with similarity scores
- Sequence homology: How many homologous proteins?
  List TOP 20 with identity/similarity scores

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 9: TRANSCRIPTION FACTOR REGULATORY DATA
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
If this gene encodes a transcription factor:

Downstream targets (genes regulated BY this TF):
- Total target gene count
- List TOP 50 target genes with regulation type (activates/represses)

DNA binding profiles:
- List ALL known binding motif IDs
- Motif family classification

Upstream regulators (TFs that regulate THIS gene):
- List known transcriptional regulators with evidence type

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 10: DRUG & PHARMACOLOGY DATA
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
If this gene/protein is a drug target:

Targeting molecules:
- How many drug/compound molecules target this protein?
- List TOP 30 molecules by development phase
- Include: molecule ID, name, mechanism, highest development phase

Clinical trials:
- How many clinical trials involve drugs targeting this gene?
- List TOP 20 trials with: trial ID, phase, status, intervention

Pharmacogenomics:
- Known drug-gene interactions affecting drug response
- Dosing guidelines if any exist

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 11: EXPRESSION PROFILES
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Tissue expression:
- Which tissues express this gene most highly?
- List TOP 30 tissues with expression scores/levels
- Note any tissue-specific or tissue-enriched patterns

Cell type expression:
- Which cell types show highest expression?
- List TOP 30 cell types with expression scores
- Note any cell type-specific patterns

Single-cell expression data (if available):
- Which single-cell datasets/experiments include this gene?
- Notable cell population patterns

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 12: DISEASE ASSOCIATIONS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Mendelian/monogenic disease links:
- What diseases are caused by mutations in this gene?
- List ALL associated diseases with: disease name, disease ID,
  inheritance pattern, evidence level

Phenotype associations:
- What clinical phenotypes are associated with this gene?
- List TOP 50 phenotype terms with IDs

Complex trait associations (GWAS):
- What traits/diseases are linked via genome-wide association studies?
- List TOP 30 GWAS associations with: trait, study ID, p-value,
  effect size if available

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
FORMATTING REQUIREMENTS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
- Present each section with clear headers
- Use tables for listing multiple items
- Always include COUNTS for every category
- For lists with >50 items: show total count + TOP 50
- For lists with <50 items: show ALL items
- Always include database identifiers (IDs), not just names
- Mark canonical/primary/reviewed entries where applicable
- If a section has no data available, state "No data available"
  rather than omitting the section

Accepted Answer

COMPREHENSIVE CROSS-DATABASE IDENTIFIER AND FUNCTIONAL MAPPING REFERENCE: Human MYC (c-Myc Proto-Oncogene)
Section 1: Gene Identifiers

Primary Gene Identifiers

Database	Identifier	Notes
HGNC ID	HGNC:7553	Approved
HGNC Symbol	MYC	Approved symbol
Full Name	MYC proto-oncogene, bHLH transcription factor
Ensembl Gene	ENSG00000136997	GRCh38
NCBI Entrez Gene	4609	protein-coding
OMIM	190080	Gene/Locus
Locus Type	gene with protein product
Locus Group	protein-coding gene
Status	Approved

Genomic Location (GRCh38/hg38)

Attribute	Value
Chromosome	8
Cytogenetic Band	8q24.21
Start Position	127,735,434
End Position	127,742,951
Strand	+ (forward)
Gene Length	7,518 bp
Biotype	protein_coding

Attribute	Value
Aliases	c-Myc, bHLHe39, MYCC
Previous Name	v-myc avian myelocytomatosis viral oncogene homolog
Gene Group	Basic helix-loop-helix proteins

Section 2: Transcript Identifiers

Ensembl Transcripts (Total: 15)

Transcript ID	Biotype	Start	End	Strand
ENST00000259523	protein_coding	127,735,434	127,740,477	+
ENST00000377970	protein_coding	127,736,084	127,741,434	+
ENST00000517291	protein_coding	127,735,519	127,738,772	+
ENST00000520751	protein_coding_CDS_not_defined	127,736,231	127,738,475	+
ENST00000524013	protein_coding	127,736,220	127,741,372	+
ENST00000621592	protein_coding	127,736,231	127,742,951	+
ENST00000641036	protein_coding	127,736,046	127,736,612	+
ENST00000641252	protein_coding	127,735,473	127,735,817	+
ENST00000651626	protein_coding	127,735,659	127,741,434	+
ENST00000652288	protein_coding	127,737,621	127,741,434	+
ENST00000707113	protein_coding	127,736,958	127,741,434	+
ENST00000707114	protein_coding	127,737,724	127,741,434	+
ENST00000707115	protein_coding	127,737,737	127,741,434	+
ENST00000707116	protein_coding	127,737,745	127,741,434	+
ENST00000707117	protein_coding_CDS_not_defined	127,739,073	127,741,434	+

Accession	Type	Chromosome	Status	MANE Select
NM_002467	mRNA	8	REVIEWED	Yes (Canonical)
NM_001354870	mRNA	8	REVIEWED	No

Accession	Chromosome	Status	MANE Select
NP_002458	8	REVIEWED	Yes (Canonical)
NP_001341799	8	REVIEWED	No

MYC Gene Complete Identifier and Functional Mapping Reference

Structured Data Sources

Database	Identifier	Notes
HGNC ID	HGNC:7553	Approved
HGNC Symbol	MYC	Approved symbol
Full Name	MYC proto-oncogene, bHLH transcription factor
Ensembl Gene	ENSG00000136997	GRCh38
NCBI Entrez Gene	4609	protein-coding
OMIM	190080	Gene/Locus
Locus Type	gene with protein product
Locus Group	protein-coding gene
Status	Approved

Exon ID	Start	End	Length	Strand
ENSE00001848036	127,735,434	127,736,623	1,190 bp	+
ENSE00003540079	127,738,248	127,739,019	772 bp	+
ENSE00001766895	127,740,398	127,740,477	80 bp	+

Accession	Name	Status	Length	Mass
P01106	Myc proto-oncogene protein	Reviewed (Canonical)	454 aa	50,565 Da
Q14899		Unreviewed	-	-
Q16591		Unreviewed	-	-
A0A0B4J1R1		Unreviewed	-	-
A0A494C1T8		Unreviewed	-	-
H0YBG3		Unreviewed	-	-

Attribute	Value
Primary Name	Myc proto-oncogene protein
Alternative Names	Class E basic helix-loop-helix protein 39; Proto-oncogene c-Myc; Transcription factor p64
Length	454 amino acids
Molecular Mass	50,565 Da

InterPro ID	Name	Type
IPR002418	Tscrpt_reg_Myc	Family
IPR003327	Myc-LZ	Domain
IPR011598	bHLH_dom	Domain
IPR012682	Tscrpt_reg_Myc_N	Domain
IPR036638	HLH_DNA-bd_sf	Homologous_superfamily
IPR050433	Myc_transcription_factors	Family

Pfam ID	Description
PF00010	Helix-loop-helix DNA-binding domain
PF01056	Myc amino-terminal region
PF02344	Myc-type, basic helix-loop-helix leucine zipper

PDB ID	Title	Method	Resolution
6G6K	Human MYC:MAX bHLHZip complex	X-RAY DIFFRACTION	1.35 Å
1NKP	Myc-Max recognizing DNA	X-RAY DIFFRACTION	1.8 Å
4Y7R	WDR5 with MYC MbIIIb peptide	X-RAY DIFFRACTION	1.898 Å
8Q1N	Cyclic peptide binder of WDR5	X-RAY DIFFRACTION	1.843 Å
8J2Q	Cypovirus Polyhedra with c-Myc	X-RAY DIFFRACTION	1.92 Å
5I4Z	Apo OmoMYC	X-RAY DIFFRACTION	1.95 Å
8X8V	Cypovirus Polyhedra with c-Myc	X-RAY DIFFRACTION	2.0 Å
8X8S	Cypovirus Polyhedra with c-Myc	X-RAY DIFFRACTION	2.04 Å
1EE4	Karyopherin with c-Myc NLS	X-RAY DIFFRACTION	2.1 Å
6G6L	Human MYC:MAX bHLHZip complex	X-RAY DIFFRACTION	2.2 Å
6G6J	Human MYC:MAX bHLHZip complex	X-RAY DIFFRACTION	2.25 Å
6E16	c-Myc-TBP-TAF1 ternary	X-RAY DIFFRACTION	2.4 Å
7T1Y	Fbw7-Skp1-MycCdegron	X-RAY DIFFRACTION	2.55 Å
8WLG	Cypovirus with c-Myc fragment	X-RAY DIFFRACTION	2.55 Å
6C4U	FHA with Myc-pTBD peptide	X-RAY DIFFRACTION	2.6 Å
5I50	OmoMYC bound to DNA	X-RAY DIFFRACTION	2.701 Å
2OR9	Anti-c-myc antibody 9E10 Fab	X-RAY DIFFRACTION	2.7 Å
7T1Z	Fbw7-Skp1-MycNdegron	X-RAY DIFFRACTION	2.77 Å
6E24	c-Myc-TBP-TAF1 ternary	X-RAY DIFFRACTION	3.001 Å
9QNH	Myc pS294 with 14-3-3sigma	X-RAY DIFFRACTION	1.3 Å
1A93	c-MYC-MAX leucine zipper	SOLUTION NMR	-
2A93	c-MYC-MAX leucine zipper (40 structures)	SOLUTION NMR	-
1MV0	BIN1 interaction with c-Myc	SOLUTION NMR	-
8OTS	OCT4 and MYC-MAX on nucleosome	ELECTRON MICROSCOPY	3.3 Å
8OTT	MYC-MAX on nucleosome at SHL+5.8	ELECTRON MICROSCOPY	3.3 Å

Attribute	Value
AlphaFold ID	P01106
Sequence Length	3,551 (full entry)
Global pLDDT	61.38
Fraction pLDDT Very High	0.21 (21%)

Note
Low overall confidence reflects intrinsically disordered regions characteristic of transcription factors.
Section 5: Cross-Species Orthologs

Organism	Gene ID	Symbol	Biotype
Mouse (Mus musculus)	ENSMUSG00000022346	Myc	protein_coding
Rat (Rattus norvegicus)	ENSRNOG00000004500	Myc	protein_coding
Zebrafish (Danio rerio)	ENSDARG00000007241	mycb	protein_coding
Zebrafish (Danio rerio)	ENSDARG00000045695	myca	protein_coding

CCDS ID
CCDS6359
CCDS87627

Organism	Ortholog
Worm (C. elegans)	No direct ortholog
Yeast (S. cerevisiae)	No direct ortholog

Section 6: Clinical Variants & AI Predictions

ClinVar Variants Summary (Total: 46)

Classification	Count
Pathogenic	4
Likely Pathogenic	1
Benign	4
Likely Benign	3
Benign/Likely Benign	2
Uncertain Significance (VUS)	10
Other/Not Classified	22

ClinVar ID	HGVS	Type	Classification
12574	NM_002467.6:c.214C>T (p.Pro72Ser)	SNV	Pathogenic
12575	NM_002467.6:c.302A>C (p.Asn101Thr)	SNV	Pathogenic
12576	NM_002467.6:c.162G>C (p.Glu54Asp)	SNV	Pathogenic
2658815	NM_002467.6:c.217A>G (p.Thr73Ala)	SNV	Pathogenic
810340	GRCh37/hg19 8q24.21(chr8:128750494-128753204)x3	CNV gain	Likely Pathogenic

ClinVar ID	HGVS	Type
1679939	c.77A>G (p.Asn26Ser)	SNV
2286886	c.409G>C (p.Glu137Gln)	SNV
2468497	c.909C>G (p.Ser303Arg)	SNV
2510151	c.671C>T (p.Ala224Val)	SNV
2658812	c.30+4A>T	SNV
3154445	c.1228A>G (p.Ile410Val)	SNV
3154448	c.1297G>C (p.Asp433His)	SNV
3297249	c.544G>A (p.Gly182Ser)	SNV
3400454	c.814G>A (p.Glu272Lys)	SNV
3915251	c.688G>T (p.Ala230Ser)	SNV

Variant ID	Effect	Score
8:127736625:T:G	donor_loss	0.98
8:127736622:AGGT:A	donor_loss	0.98
8:127736623:GGT:G	donor_loss	0.98
8:127736624:GTAA:G	donor_loss	0.98
8:127736610:T:TA	donor_gain	0.97
8:127736611:A:AA	donor_gain	0.97
8:127736620:CCAG:C	donor_gain	0.97
8:127736624:G:GG	donor_gain	0.96
8:127736197:C:G	donor_gain	0.93
8:127736619:ACCAG:A	donor_gain	0.93
8:127737196:G:GT	donor_gain	0.92
8:127736621:CAG:C	donor_gain	0.87
8:127736612:G:GG	donor_gain	0.85
8:127736622:AG:A	donor_gain	0.82
8:127736623:GG:G	donor_gain	0.82
8:127736196:GC:G	donor_gain	0.77
8:127736633:G:GT	donor_gain	0.75
8:127737196:GAA:G	donor_gain	0.73
8:127736197:C:CG	donor_gain	0.70
8:127737198:A:G	donor_gain	0.68

Variant ID	Protein Change	Pathogenicity Score	Class
8:127738305:G:C	D15H	0.739	likely_pathogenic
8:127738299:G:C	D13H	0.664	likely_pathogenic
8:127738300:A:T	D13V	0.650	likely_pathogenic
8:127738306:A:T	D15V	0.650	likely_pathogenic
8:127738300:A:C	D13A	0.572	likely_pathogenic
8:127738305:G:T	D15Y	0.610	likely_pathogenic

Pathway ID	Name	Disease?
R-HSA-1362277	Transcription of E2F targets under negative control by DREAM complex	No
R-HSA-201556	Signaling by ALK	No
R-HSA-2122947	NOTCH1 Intracellular Domain Regulates Transcription	No
R-HSA-2173796	SMAD2/SMAD3:SMAD4 heterotrimer regulates transcription	No
R-HSA-2644606	Constitutive Signaling by NOTCH1 PEST Domain Mutants	Yes
R-HSA-2894862	Constitutive Signaling by NOTCH1 HD+PEST Domain Mutants	Yes
R-HSA-4411364	Binding of TCF/LEF:CTNNB1 to target gene promoters	No
R-HSA-5687128	MAPK6/MAPK4 signaling	No
R-HSA-5689880	Ub-specific processing proteases	No
R-HSA-6785807	Interleukin-4 and Interleukin-13 signaling	No
R-HSA-69202	Cyclin E associated events during G1/S transition	No
R-HSA-69656	Cyclin A:Cdk2-associated events at S phase entry	No
R-HSA-8866911	TFAP2 family regulates transcription of cell cycle factors	No
R-HSA-8951430	RUNX3 regulates WNT signaling	No
R-HSA-9018519	Estrogen-dependent gene expression	No
R-HSA-9616222	Transcriptional regulation of granulopoiesis	No
R-HSA-9764562	Regulation of CDH1 mRNA translation by microRNAs	No
R-HSA-9818749	Regulation of NFE2L2 gene expression	No
R-HSA-9909649	Regulation of PD-L1(CD274) transcription	No

GO ID	Term
GO:0000978	RNA polymerase II cis-regulatory region sequence-specific DNA binding
GO:0000981	DNA-binding transcription factor activity, RNA polymerase II-specific
GO:0001046	core promoter sequence-specific DNA binding
GO:0001221	transcription coregulator binding
GO:0001227	DNA-binding transcription repressor activity, RNA polymerase II-specific
GO:0001228	DNA-binding transcription activator activity, RNA polymerase II-specific
GO:0003677	DNA binding
GO:0031625	ubiquitin protein ligase binding
GO:0042802	identical protein binding
GO:0044877	protein-containing complex binding
GO:0046983	protein dimerization activity
GO:0070888	E-box binding
GO:0140297	DNA-binding transcription factor binding
GO:0140537	transcription regulator activator activity
GO:1905761	SCF ubiquitin ligase complex binding

GO ID	Term
GO:0000082	G1/S transition of mitotic cell cycle
GO:0000122	negative regulation of transcription by RNA polymerase II
GO:0000165	MAPK cascade
GO:0006338	chromatin remodeling
GO:0006357	regulation of transcription by RNA polymerase II
GO:0006366	transcription by RNA polymerase II
GO:0006974	DNA damage response
GO:0008284	positive regulation of cell population proliferation
GO:0008630	intrinsic apoptotic signaling pathway in response to DNA damage
GO:0010468	regulation of gene expression
GO:0010628	positive regulation of gene expression
GO:0016055	Wnt signaling pathway
GO:0016072	rRNA metabolic process
GO:0032204	regulation of telomere maintenance
GO:0043066	negative regulation of apoptotic process
GO:0045893	positive regulation of DNA-templated transcription
GO:0045944	positive regulation of transcription by RNA polymerase II
GO:0051276	chromosome organization
GO:0071456	cellular response to hypoxia
GO:1902255	positive regulation of intrinsic apoptotic signaling pathway by p53 class mediator

GO ID	Term
GO:0000785	chromatin
GO:0000791	euchromatin
GO:0005634	nucleus
GO:0005654	nucleoplasm
GO:0005730	nucleolus
GO:0005819	spindle
GO:0016604	nuclear body
GO:0030424	axon
GO:0032991	protein-containing complex
GO:0048471	perinuclear region of cytoplasm
GO:0071943	Myc-Max complex
GO:0090571	RNA polymerase II transcription repressor complex

UniProt B	Score	Protein Name
P01106	997	MYC (self)
P04637	997	TP53
P38398	995	BRCA1
Q09472	994	EP300
Q9Y4A5	993	TRRAP
Q96GN5	991	USP28
Q01094	990	E2F1
O00499	989	BIN1
P25912	987	HIC1
Q9UL40	986	ZNF131
P84022	983	SMAD3
Q9Y6K1	983	DNMT3A
Q16665	982	HIF1A
Q9NZI8	980	IGF2BP1
Q13105	976	ZBTB17

Gene Symbol	Interaction Types
MAX	Affinity Capture-Western, Affinity Capture-MS
FBXW7	Affinity Capture-Western
USP28	Affinity Capture-Western
USP37	Affinity Capture-Western
USP36	Affinity Capture-Western
CREBBP	Affinity Capture-Western, Reconstituted Complex
KAT2A	Affinity Capture-Western, Reconstituted Complex
TRRAP	Reconstituted Complex
SKP2	Affinity Capture-Western
HDAC1	Affinity Capture-MS

UniProt	Top Similarity	Avg Similarity
P01106	1.0000	0.9947
P23583	1.0000	0.9947
P68271	1.0000	0.9944
P68272	1.0000	0.9944
P0C0N8	1.0000	0.9921
P0C0N9	1.0000	0.9921
A1YG22	0.9999	0.9947
A2T7L5	0.9999	0.9948
B8XIA5	0.9999	0.9948
P01108	0.9999	0.9942

UniProt	Identity %	Bitscore
P61244	100.0	290
P61245	100.0	290
P68271	100.0	796
P68272	100.0	796
A1YG22	99.8	794
P23583	99.8	815
Q64210	99.1	819
P20389	99.1	819
B8XIA5	99.1	805
P01106	99.1	816

Motif ID	Name	Collection	Class	Family
MA0147.4	MYC	CORE	Basic helix-loop-helix factors	bHLH-ZIP
MA0147.3	MYC	CORE	Basic helix-loop-helix factors	bHLH-ZIP
MA0059.2	MAX::MYC	CORE	Basic helix-loop-helix factors	bHLH-ZIP
MA0059.1	MAX::MYC	CORE	Basic helix-loop-helix factors	bHLH-ZIP

Target Gene	Mechanism	Score
CCND1	transcriptional regulation	0.50
CDK4	transcriptional regulation	0.57
CDC25A	transcriptional regulation	0.63
CCNA2	transcriptional regulation	0.42
CDK6	transcriptional regulation	0.45
CUL1	transcriptional regulation	0.48
DNMT3A	binding	0.71
LDHA	transcriptional regulation	0.56
HK2	transcriptional regulation	0.37
SLC2A1	transcriptional regulation	0.43
VEGFA	transcriptional regulation	0.46
ENO1	transcriptional regulation	0.41
SIRT2	transcriptional regulation	0.47

Target Gene	Mechanism	Score
CDKN1A	transcriptional regulation	0.78
CDKN2A	transcriptional regulation	0.77
CDKN2B	transcriptional regulation	0.60
CDKN1B	transcriptional regulation	0.53
SMAD2	—	0.68
SMAD3	binding	0.69
HLA-A	transcriptional regulation	0.27
HLA-B	transcriptional regulation	0.27
HLA-C	transcriptional regulation	0.26
DKK1	transcriptional regulation	0.39
SFRP1	transcriptional regulation	0.36

TF	Confidence
E2F1	High
CTNNB1 (β-catenin)	High
CTCF	High
DLX5	High
HNF4A	High
IKZF1	High
NOTCH1	(via SIGNOR)
STAT3	(via SIGNOR)
LEF1	High
FOXM1	—
ERG	—

TF	Confidence
FOS	High
JUN	High
JUND	High
CEBPA	High
CEBPB	High
HOXB13	High
IKZF3	High
KLF11	High
GLI1	High
ENO1	High
SMAD3/SMAD4	(via SIGNOR)

Target ID	Name	Type
CHEMBL1250348	Myc proto-oncogene protein	SINGLE PROTEIN
CHEMBL3301395	c-Myc/Max	PROTEIN COMPLEX
CHEMBL4106127	c-Myc/c-Max	PROTEIN-PROTEIN INTERACTION
CHEMBL4296141	VHL/Myc proto-oncogene protein	PROTEIN-PROTEIN INTERACTION
CHEMBL4888452	MAP2K3/Myc proto-oncogene protein	PROTEIN-PROTEIN INTERACTION
CHEMBL5465202	Cereblon/Myc proto-oncogene protein	PROTEIN-PROTEIN INTERACTION
CHEMBL5465553	WDR5-MYC	PROTEIN-PROTEIN INTERACTION

ChEMBL ID	Name	Type	Highest Phase
CHEMBL165	RESVERATROL	Small molecule	Phase 3
CHEMBL4297458	EZOBRESIB	Small molecule	Phase 2

Attribute	Value
PharmGKB ID	PA31353
Symbol	MYC
VIP Gene	Yes
CPIC Guideline	No
Chromosome	chr8

Attribute	Value
Gene ID	ENSG00000136997
Species	Homo sapiens
Expression Breadth	Ubiquitous
Total Present Calls	256
Max Expression Score	99.12