Provide a comprehensive cross-database identifier and functional mapping reference for human SRC. This should serve as a definitive lookup resource for researchers. ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 1: GENE IDENTIFIERS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Provide ALL gene-level database identifiers: - HGNC ID and approved symbol - Ensembl gene ID (ENSG) - NCBI Entrez Gene ID - OMIM gene/locus ID - Genomic location: chromosome, start position, end position, strand ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 2: TRANSCRIPT IDENTIFIERS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ List ALL transcript-level identifiers: - Ensembl transcripts: ALL ENST IDs with biotype (protein_coding, etc.) How many total transcripts? - RefSeq transcripts: ALL NM_ mRNA accessions Mark which is MANE Select (canonical clinical standard) - CCDS IDs: ALL consensus coding sequence identifiers For the CANONICAL/MANE SELECT transcript: - List ALL exon IDs (ENSE) with genomic coordinates - Total exon count ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 3: PROTEIN IDENTIFIERS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ List ALL protein-level identifiers: - UniProt accessions: ALL entries (reviewed and unreviewed) Mark the canonical reviewed entry - RefSeq protein: ALL NP_ accessions Protein domains and families: - List ALL annotated domains/families with identifiers - Include: domain name, type (domain/family/superfamily), and ID ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 4: STRUCTURE IDENTIFIERS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Experimental structures: - List ALL PDB structure IDs - For each: experimental method (X-ray, NMR, Cryo-EM) and resolution - Total PDB structure count Predicted structures: - AlphaFold model ID and confidence metrics (pLDDT) ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 5: CROSS-SPECIES ORTHOLOGS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ List orthologous genes in key model organisms (where available): - Mouse (Mus musculus): gene ID, symbol - Rat (Rattus norvegicus): gene ID, symbol - Zebrafish (Danio rerio): gene ID, symbol - Fruit fly (Drosophila melanogaster): gene ID, symbol - Worm (C. elegans): gene ID, symbol - Yeast (S. cerevisiae): gene ID, symbol ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 6: CLINICAL VARIANTS & AI PREDICTIONS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Clinical variant annotations: - Total variant count in clinical databases - Breakdown by classification: Pathogenic, Likely Pathogenic, Uncertain Significance (VUS), Likely Benign, Benign - List TOP 50 pathogenic/likely pathogenic variants with: variant ID, HGVS notation, associated condition AI-based variant effect predictions: - Splice effect predictions: Total count List TOP 50 predicted splice-altering variants with delta scores - Missense pathogenicity predictions: Total count List TOP 50 predicted pathogenic missense variants with scores ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 7: BIOLOGICAL PATHWAYS & GENE ONTOLOGY ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Pathway membership: - List ALL biological pathways this gene participates in - Include pathway IDs and names - Total pathway count Gene Ontology annotations: - Biological Process: count and TOP 20 terms with IDs - Molecular Function: count and TOP 20 terms with IDs - Cellular Component: count and TOP 20 terms with IDs ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 8: PROTEIN INTERACTIONS & MOLECULAR NETWORKS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Protein-protein interactions: - Total interaction count - List TOP 50 highest-confidence interacting proteins with scores Protein similarity (evolutionary and structural): - Structural/embedding similarity: How many similar proteins? List TOP 20 with similarity scores - Sequence homology: How many homologous proteins? List TOP 20 with identity/similarity scores ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 9: TRANSCRIPTION FACTOR REGULATORY DATA ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ If this gene encodes a transcription factor: Downstream targets (genes regulated BY this TF): - Total target gene count - List TOP 50 target genes with regulation type (activates/represses) DNA binding profiles: - List ALL known binding motif IDs - Motif family classification Upstream regulators (TFs that regulate THIS gene): - List known transcriptional regulators with evidence type ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 10: DRUG & PHARMACOLOGY DATA ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ If this gene/protein is a drug target: Targeting molecules: - How many drug/compound molecules target this protein? - List TOP 30 molecules by development phase - Include: molecule ID, name, mechanism, highest development phase Clinical trials: - How many clinical trials involve drugs targeting this gene? - List TOP 20 trials with: trial ID, phase, status, intervention Pharmacogenomics: - Known drug-gene interactions affecting drug response - Dosing guidelines if any exist ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 11: EXPRESSION PROFILES ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Tissue expression: - Which tissues express this gene most highly? - List TOP 30 tissues with expression scores/levels - Note any tissue-specific or tissue-enriched patterns Cell type expression: - Which cell types show highest expression? - List TOP 30 cell types with expression scores - Note any cell type-specific patterns Single-cell expression data (if available): - Which single-cell datasets/experiments include this gene? - Notable cell population patterns ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 12: DISEASE ASSOCIATIONS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Mendelian/monogenic disease links: - What diseases are caused by mutations in this gene? - List ALL associated diseases with: disease name, disease ID, inheritance pattern, evidence level Phenotype associations: - What clinical phenotypes are associated with this gene? - List TOP 50 phenotype terms with IDs Complex trait associations (GWAS): - What traits/diseases are linked via genome-wide association studies? - List TOP 30 GWAS associations with: trait, study ID, p-value, effect size if available ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ FORMATTING REQUIREMENTS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ - Present each section with clear headers - Use tables for listing multiple items - Always include COUNTS for every category - For lists with 50 items: show total count + TOP 50 - For lists with

Question

Provide a comprehensive cross-database identifier and functional mapping
reference for human SRC. This should serve as a definitive
lookup resource for researchers.

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 1: GENE IDENTIFIERS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Provide ALL gene-level database identifiers:
- HGNC ID and approved symbol
- Ensembl gene ID (ENSG)
- NCBI Entrez Gene ID
- OMIM gene/locus ID
- Genomic location: chromosome, start position, end position, strand

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 2: TRANSCRIPT IDENTIFIERS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
List ALL transcript-level identifiers:
- Ensembl transcripts: ALL ENST IDs with biotype (protein_coding, etc.)
  How many total transcripts?
- RefSeq transcripts: ALL NM_ mRNA accessions
  Mark which is MANE Select (canonical clinical standard)
- CCDS IDs: ALL consensus coding sequence identifiers

For the CANONICAL/MANE SELECT transcript:
- List ALL exon IDs (ENSE) with genomic coordinates
- Total exon count

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 3: PROTEIN IDENTIFIERS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
List ALL protein-level identifiers:
- UniProt accessions: ALL entries (reviewed and unreviewed)
  Mark the canonical reviewed entry
- RefSeq protein: ALL NP_ accessions

Protein domains and families:
- List ALL annotated domains/families with identifiers
- Include: domain name, type (domain/family/superfamily), and ID

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 4: STRUCTURE IDENTIFIERS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Experimental structures:
- List ALL PDB structure IDs
- For each: experimental method (X-ray, NMR, Cryo-EM) and resolution
- Total PDB structure count

Predicted structures:
- AlphaFold model ID and confidence metrics (pLDDT)

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 5: CROSS-SPECIES ORTHOLOGS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
List orthologous genes in key model organisms (where available):
- Mouse (Mus musculus): gene ID, symbol
- Rat (Rattus norvegicus): gene ID, symbol
- Zebrafish (Danio rerio): gene ID, symbol
- Fruit fly (Drosophila melanogaster): gene ID, symbol
- Worm (C. elegans): gene ID, symbol
- Yeast (S. cerevisiae): gene ID, symbol

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 6: CLINICAL VARIANTS & AI PREDICTIONS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Clinical variant annotations:
- Total variant count in clinical databases
- Breakdown by classification: Pathogenic, Likely Pathogenic,
  Uncertain Significance (VUS), Likely Benign, Benign
- List TOP 50 pathogenic/likely pathogenic variants with:
  variant ID, HGVS notation, associated condition

AI-based variant effect predictions:
- Splice effect predictions: Total count
  List TOP 50 predicted splice-altering variants with delta scores
- Missense pathogenicity predictions: Total count
  List TOP 50 predicted pathogenic missense variants with scores

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 7: BIOLOGICAL PATHWAYS & GENE ONTOLOGY
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Pathway membership:
- List ALL biological pathways this gene participates in
- Include pathway IDs and names
- Total pathway count

Gene Ontology annotations:
- Biological Process: count and TOP 20 terms with IDs
- Molecular Function: count and TOP 20 terms with IDs
- Cellular Component: count and TOP 20 terms with IDs

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 8: PROTEIN INTERACTIONS & MOLECULAR NETWORKS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Protein-protein interactions:
- Total interaction count
- List TOP 50 highest-confidence interacting proteins with scores

Protein similarity (evolutionary and structural):
- Structural/embedding similarity: How many similar proteins?
  List TOP 20 with similarity scores
- Sequence homology: How many homologous proteins?
  List TOP 20 with identity/similarity scores

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 9: TRANSCRIPTION FACTOR REGULATORY DATA
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
If this gene encodes a transcription factor:

Downstream targets (genes regulated BY this TF):
- Total target gene count
- List TOP 50 target genes with regulation type (activates/represses)

DNA binding profiles:
- List ALL known binding motif IDs
- Motif family classification

Upstream regulators (TFs that regulate THIS gene):
- List known transcriptional regulators with evidence type

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 10: DRUG & PHARMACOLOGY DATA
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
If this gene/protein is a drug target:

Targeting molecules:
- How many drug/compound molecules target this protein?
- List TOP 30 molecules by development phase
- Include: molecule ID, name, mechanism, highest development phase

Clinical trials:
- How many clinical trials involve drugs targeting this gene?
- List TOP 20 trials with: trial ID, phase, status, intervention

Pharmacogenomics:
- Known drug-gene interactions affecting drug response
- Dosing guidelines if any exist

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 11: EXPRESSION PROFILES
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Tissue expression:
- Which tissues express this gene most highly?
- List TOP 30 tissues with expression scores/levels
- Note any tissue-specific or tissue-enriched patterns

Cell type expression:
- Which cell types show highest expression?
- List TOP 30 cell types with expression scores
- Note any cell type-specific patterns

Single-cell expression data (if available):
- Which single-cell datasets/experiments include this gene?
- Notable cell population patterns

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 12: DISEASE ASSOCIATIONS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Mendelian/monogenic disease links:
- What diseases are caused by mutations in this gene?
- List ALL associated diseases with: disease name, disease ID,
  inheritance pattern, evidence level

Phenotype associations:
- What clinical phenotypes are associated with this gene?
- List TOP 50 phenotype terms with IDs

Complex trait associations (GWAS):
- What traits/diseases are linked via genome-wide association studies?
- List TOP 30 GWAS associations with: trait, study ID, p-value,
  effect size if available

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
FORMATTING REQUIREMENTS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
- Present each section with clear headers
- Use tables for listing multiple items
- Always include COUNTS for every category
- For lists with >50 items: show total count + TOP 50
- For lists with <50 items: show ALL items
- Always include database identifiers (IDs), not just names
- Mark canonical/primary/reviewed entries where applicable
- If a section has no data available, state "No data available"
  rather than omitting the section

Accepted Answer

Section 1: Gene Identifiers Primary Gene Identifiers
DatabaseIdentifierDescription HGNCHGNC:11283Approved symbol: SRC HGNC NameSRC proto-oncogene, non-receptor tyrosine kinaseOfficial full name Ensembl GeneENSG00000197122Human gene (GRCh38) NCBI Entrez6714Gene ID OMIM190090Gene/locus entry Genomic Location (GRCh38/hg38) AttributeValue Chromosome20 Start Position37,344,673 End Position37,406,050 Strand+ (positive) Cytoband20q11.23 Gene Length61,378 bp Biotypeprotein_coding Additional Gene …

Attribute	Value
Locus Type	gene with protein product
Gene Groups	SH2 domain containing; Src family tyrosine kinases
Previous Symbols	SRC1
Aliases	ASV, c-src
Status	Approved

Transcript ID	Biotype	Start	End	Notes
ENST00000373578	protein_coding	37,346,140	37,406,050	Major transcript
ENST00000358208	protein_coding	37,384,150	37,406,050
ENST00000373558	protein_coding	37,384,150	37,406,050
ENST00000373567	protein_coding	37,383,668	37,406,050
ENST00000692112	protein_coding	37,346,109	37,406,050
ENST00000692423	protein_coding	37,346,140	37,406,050
ENST00000693012	protein_coding	37,346,140	37,387,801
ENST00000876226	protein_coding	37,344,673	37,405,431
ENST00000876227	protein_coding	37,344,681	37,405,429
ENST00000876228	protein_coding	37,344,714	37,405,418
ENST00000876229	protein_coding	37,344,718	37,405,415
ENST00000876230	protein_coding	37,345,108	37,405,414
ENST00000876231	protein_coding	37,345,138	37,405,432
ENST00000876232	protein_coding	37,345,213	37,405,418
ENST00000876233	protein_coding	37,345,936	37,405,418
ENST00000876234	protein_coding	37,346,125	37,405,415
ENST00000876235	protein_coding	37,346,140	37,405,415
ENST00000876236	protein_coding	37,346,140	37,404,632
ENST00000876237	protein_coding	37,383,899	37,405,420
ENST00000921683	protein_coding	37,345,711	37,405,415
ENST00000921684	protein_coding	37,346,324	37,405,415
ENST00000950593	protein_coding	37,383,596	37,405,416
ENST00000467556	retained_intron	37,400,149	37,401,957
ENST00000472968	retained_intron	37,384,323	37,394,174
ENST00000489153	retained_intron	37,393,745	37,397,746
ENST00000493775	retained_intron	37,402,313	37,403,031
ENST00000477066	CDS_not_defined	37,396,426	37,405,422
ENST00000477475	CDS_not_defined	37,400,251	37,402,292
ENST00000497734	CDS_not_defined	37,344,685	37,382,787

Accession	Type	Status	MANE Select
NM_198291	mRNA	REVIEWED	✓ MANE Select
NM_005417	mRNA	REVIEWED

Accession	Status	MANE Select
NP_938033	REVIEWED	✓ MANE Select
NP_005408	REVIEWED

SRC Gene Complete Identifier and Functional Mapping Reference

Structured Data Sources

Database	Identifier	Description
HGNC	HGNC:11283	Approved symbol: SRC
HGNC Name	SRC proto-oncogene, non-receptor tyrosine kinase	Official full name
Ensembl Gene	ENSG00000197122	Human gene (GRCh38)
NCBI Entrez	6714	Gene ID
OMIM	190090	Gene/locus entry

Attribute	Value
Chromosome	20
Start Position	37,344,673
End Position	37,406,050
Strand	+ (positive)
Cytoband	20q11.23
Gene Length	61,378 bp
Biotype	protein_coding