Provide a comprehensive cross-database identifier and functional mapping reference for human PDGFRA. This should serve as a definitive lookup resource for researchers. ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 1: GENE IDENTIFIERS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Provide ALL gene-level database identifiers: - HGNC ID and approved symbol - Ensembl gene ID (ENSG) - NCBI Entrez Gene ID - OMIM gene/locus ID - Genomic location: chromosome, start position, end position, strand ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 2: TRANSCRIPT IDENTIFIERS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ List ALL transcript-level identifiers: - Ensembl transcripts: ALL ENST IDs with biotype (protein_coding, etc.) How many total transcripts? - RefSeq transcripts: ALL NM_ mRNA accessions Mark which is MANE Select (canonical clinical standard) - CCDS IDs: ALL consensus coding sequence identifiers For the CANONICAL/MANE SELECT transcript: - List ALL exon IDs (ENSE) with genomic coordinates - Total exon count ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 3: PROTEIN IDENTIFIERS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ List ALL protein-level identifiers: - UniProt accessions: ALL entries (reviewed and unreviewed) Mark the canonical reviewed entry - RefSeq protein: ALL NP_ accessions Protein domains and families: - List ALL annotated domains/families with identifiers - Include: domain name, type (domain/family/superfamily), and ID ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 4: STRUCTURE IDENTIFIERS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Experimental structures: - List ALL PDB structure IDs - For each: experimental method (X-ray, NMR, Cryo-EM) and resolution - Total PDB structure count Predicted structures: - AlphaFold model ID and confidence metrics (pLDDT) ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 5: CROSS-SPECIES ORTHOLOGS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ List orthologous genes in key model organisms (where available): - Mouse (Mus musculus): gene ID, symbol - Rat (Rattus norvegicus): gene ID, symbol - Zebrafish (Danio rerio): gene ID, symbol - Fruit fly (Drosophila melanogaster): gene ID, symbol - Worm (C. elegans): gene ID, symbol - Yeast (S. cerevisiae): gene ID, symbol ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 6: CLINICAL VARIANTS & AI PREDICTIONS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Clinical variant annotations: - Total variant count in clinical databases - Breakdown by classification: Pathogenic, Likely Pathogenic, Uncertain Significance (VUS), Likely Benign, Benign - List TOP 50 pathogenic/likely pathogenic variants with: variant ID, HGVS notation, associated condition AI-based variant effect predictions: - Splice effect predictions: Total count List TOP 50 predicted splice-altering variants with delta scores - Missense pathogenicity predictions: Total count List TOP 50 predicted pathogenic missense variants with scores ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 7: BIOLOGICAL PATHWAYS & GENE ONTOLOGY ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Pathway membership: - List ALL biological pathways this gene participates in - Include pathway IDs and names - Total pathway count Gene Ontology annotations: - Biological Process: count and TOP 20 terms with IDs - Molecular Function: count and TOP 20 terms with IDs - Cellular Component: count and TOP 20 terms with IDs ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 8: PROTEIN INTERACTIONS & MOLECULAR NETWORKS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Protein-protein interactions: - Total interaction count - List TOP 50 highest-confidence interacting proteins with scores Protein similarity (evolutionary and structural): - Structural/embedding similarity: How many similar proteins? List TOP 20 with similarity scores - Sequence homology: How many homologous proteins? List TOP 20 with identity/similarity scores ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 9: TRANSCRIPTION FACTOR REGULATORY DATA ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ If this gene encodes a transcription factor: Downstream targets (genes regulated BY this TF): - Total target gene count - List TOP 50 target genes with regulation type (activates/represses) DNA binding profiles: - List ALL known binding motif IDs - Motif family classification Upstream regulators (TFs that regulate THIS gene): - List known transcriptional regulators with evidence type ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 10: DRUG & PHARMACOLOGY DATA ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ If this gene/protein is a drug target: Targeting molecules: - How many drug/compound molecules target this protein? - List TOP 30 molecules by development phase - Include: molecule ID, name, mechanism, highest development phase Clinical trials: - How many clinical trials involve drugs targeting this gene? - List TOP 20 trials with: trial ID, phase, status, intervention Pharmacogenomics: - Known drug-gene interactions affecting drug response - Dosing guidelines if any exist ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 11: EXPRESSION PROFILES ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Tissue expression: - Which tissues express this gene most highly? - List TOP 30 tissues with expression scores/levels - Note any tissue-specific or tissue-enriched patterns Cell type expression: - Which cell types show highest expression? - List TOP 30 cell types with expression scores - Note any cell type-specific patterns Single-cell expression data (if available): - Which single-cell datasets/experiments include this gene? - Notable cell population patterns ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ SECTION 12: DISEASE ASSOCIATIONS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ Mendelian/monogenic disease links: - What diseases are caused by mutations in this gene? - List ALL associated diseases with: disease name, disease ID, inheritance pattern, evidence level Phenotype associations: - What clinical phenotypes are associated with this gene? - List TOP 50 phenotype terms with IDs Complex trait associations (GWAS): - What traits/diseases are linked via genome-wide association studies? - List TOP 30 GWAS associations with: trait, study ID, p-value, effect size if available ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ FORMATTING REQUIREMENTS ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ - Present each section with clear headers - Use tables for listing multiple items - Always include COUNTS for every category - For lists with 50 items: show total count + TOP 50 - For lists with

Question

Provide a comprehensive cross-database identifier and functional mapping
reference for human PDGFRA. This should serve as a definitive
lookup resource for researchers.

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 1: GENE IDENTIFIERS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Provide ALL gene-level database identifiers:
- HGNC ID and approved symbol
- Ensembl gene ID (ENSG)
- NCBI Entrez Gene ID
- OMIM gene/locus ID
- Genomic location: chromosome, start position, end position, strand

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 2: TRANSCRIPT IDENTIFIERS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
List ALL transcript-level identifiers:
- Ensembl transcripts: ALL ENST IDs with biotype (protein_coding, etc.)
  How many total transcripts?
- RefSeq transcripts: ALL NM_ mRNA accessions
  Mark which is MANE Select (canonical clinical standard)
- CCDS IDs: ALL consensus coding sequence identifiers

For the CANONICAL/MANE SELECT transcript:
- List ALL exon IDs (ENSE) with genomic coordinates
- Total exon count

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 3: PROTEIN IDENTIFIERS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
List ALL protein-level identifiers:
- UniProt accessions: ALL entries (reviewed and unreviewed)
  Mark the canonical reviewed entry
- RefSeq protein: ALL NP_ accessions

Protein domains and families:
- List ALL annotated domains/families with identifiers
- Include: domain name, type (domain/family/superfamily), and ID

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 4: STRUCTURE IDENTIFIERS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Experimental structures:
- List ALL PDB structure IDs
- For each: experimental method (X-ray, NMR, Cryo-EM) and resolution
- Total PDB structure count

Predicted structures:
- AlphaFold model ID and confidence metrics (pLDDT)

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 5: CROSS-SPECIES ORTHOLOGS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
List orthologous genes in key model organisms (where available):
- Mouse (Mus musculus): gene ID, symbol
- Rat (Rattus norvegicus): gene ID, symbol
- Zebrafish (Danio rerio): gene ID, symbol
- Fruit fly (Drosophila melanogaster): gene ID, symbol
- Worm (C. elegans): gene ID, symbol
- Yeast (S. cerevisiae): gene ID, symbol

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 6: CLINICAL VARIANTS & AI PREDICTIONS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Clinical variant annotations:
- Total variant count in clinical databases
- Breakdown by classification: Pathogenic, Likely Pathogenic,
  Uncertain Significance (VUS), Likely Benign, Benign
- List TOP 50 pathogenic/likely pathogenic variants with:
  variant ID, HGVS notation, associated condition

AI-based variant effect predictions:
- Splice effect predictions: Total count
  List TOP 50 predicted splice-altering variants with delta scores
- Missense pathogenicity predictions: Total count
  List TOP 50 predicted pathogenic missense variants with scores

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 7: BIOLOGICAL PATHWAYS & GENE ONTOLOGY
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Pathway membership:
- List ALL biological pathways this gene participates in
- Include pathway IDs and names
- Total pathway count

Gene Ontology annotations:
- Biological Process: count and TOP 20 terms with IDs
- Molecular Function: count and TOP 20 terms with IDs
- Cellular Component: count and TOP 20 terms with IDs

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 8: PROTEIN INTERACTIONS & MOLECULAR NETWORKS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Protein-protein interactions:
- Total interaction count
- List TOP 50 highest-confidence interacting proteins with scores

Protein similarity (evolutionary and structural):
- Structural/embedding similarity: How many similar proteins?
  List TOP 20 with similarity scores
- Sequence homology: How many homologous proteins?
  List TOP 20 with identity/similarity scores

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 9: TRANSCRIPTION FACTOR REGULATORY DATA
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
If this gene encodes a transcription factor:

Downstream targets (genes regulated BY this TF):
- Total target gene count
- List TOP 50 target genes with regulation type (activates/represses)

DNA binding profiles:
- List ALL known binding motif IDs
- Motif family classification

Upstream regulators (TFs that regulate THIS gene):
- List known transcriptional regulators with evidence type

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 10: DRUG & PHARMACOLOGY DATA
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
If this gene/protein is a drug target:

Targeting molecules:
- How many drug/compound molecules target this protein?
- List TOP 30 molecules by development phase
- Include: molecule ID, name, mechanism, highest development phase

Clinical trials:
- How many clinical trials involve drugs targeting this gene?
- List TOP 20 trials with: trial ID, phase, status, intervention

Pharmacogenomics:
- Known drug-gene interactions affecting drug response
- Dosing guidelines if any exist

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 11: EXPRESSION PROFILES
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Tissue expression:
- Which tissues express this gene most highly?
- List TOP 30 tissues with expression scores/levels
- Note any tissue-specific or tissue-enriched patterns

Cell type expression:
- Which cell types show highest expression?
- List TOP 30 cell types with expression scores
- Note any cell type-specific patterns

Single-cell expression data (if available):
- Which single-cell datasets/experiments include this gene?
- Notable cell population patterns

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
SECTION 12: DISEASE ASSOCIATIONS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
Mendelian/monogenic disease links:
- What diseases are caused by mutations in this gene?
- List ALL associated diseases with: disease name, disease ID,
  inheritance pattern, evidence level

Phenotype associations:
- What clinical phenotypes are associated with this gene?
- List TOP 50 phenotype terms with IDs

Complex trait associations (GWAS):
- What traits/diseases are linked via genome-wide association studies?
- List TOP 30 GWAS associations with: trait, study ID, p-value,
  effect size if available

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
FORMATTING REQUIREMENTS
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
- Present each section with clear headers
- Use tables for listing multiple items
- Always include COUNTS for every category
- For lists with >50 items: show total count + TOP 50
- For lists with <50 items: show ALL items
- Always include database identifiers (IDs), not just names
- Mark canonical/primary/reviewed entries where applicable
- If a section has no data available, state "No data available"
  rather than omitting the section

Accepted Answer

Section 1: Gene Identifiers
DatabaseIdentifierDescription HGNC IDHGNC:8803Approved symbol: PDGFRA HGNC Nameplatelet derived growth factor receptor alpha Ensembl GeneENSG00000134853 NCBI Entrez5156 OMIM173490Gene/locus CCDSCCDS3495Consensus CDS PharmGKBPA33147VIP gene Genomic Location (GRCh38/hg38) AttributeValue Chromosome4 Cytogenetic Band4q12 Start Position54,229,130 End Position54,298,246 Strand+ (forward) Genomic AccessionNC_000004.12 Gene Span~69.1 kb Gene Aliases CD140a, CD140A
PDGFR2, …

Transcript ID	Biotype	Start	End	Strand
ENST00000257290	protein_coding	54,229,293	54,298,245	+
ENST00000958745	protein_coding	54,229,132	54,298,243	+
ENST00000958746	protein_coding	54,229,147	54,298,244	+
ENST00000958747	protein_coding	54,229,249	54,298,243	+
ENST00000958748	protein_coding	54,229,281	54,298,242	+
ENST00000958749	protein_coding	54,229,303	54,298,246	+
ENST00000958750	protein_coding	54,229,823	54,298,245	+
ENST00000958751	protein_coding	54,229,881	54,298,244	+
ENST00000958752	protein_coding	54,230,014	54,298,242	+
ENST00000958753	protein_coding	54,229,130	54,297,345	+
ENST00000958754	protein_coding	54,232,722	54,298,244	+
ENST00000958755	protein_coding	54,233,102	54,298,246	+
ENST00000870889	protein_coding	54,231,979	54,298,245	+
ENST00000870890	protein_coding	54,233,071	54,298,244	+
ENST00000508170	protein_coding	54,229,280	54,265,353	+
ENST00000503856	protein_coding	54,229,843	54,263,776	+
ENST00000504461	protein_coding	54,230,322	54,263,773	+
ENST00000512143	protein_coding	54,229,293	54,261,412	+
ENST00000512522	protein_coding	54,243,575	54,263,762	+
ENST00000509490	nonsense_mediated_decay	54,229,311	54,281,978	+
ENST00000461294	retained_intron	54,276,751	54,278,246	+
ENST00000507536	retained_intron	54,277,176	54,281,977	+
ENST00000509092	retained_intron	54,229,292	54,280,758	+

PDGFRA Gene Complete Identifier and Functional Mapping Reference

Structured Data Sources

Database	Identifier	Description
HGNC ID	HGNC:8803	Approved symbol: PDGFRA
HGNC Name	platelet derived growth factor receptor alpha
Ensembl Gene	ENSG00000134853
NCBI Entrez	5156
OMIM	173490	Gene/locus
CCDS	CCDS3495	Consensus CDS
PharmGKB	PA33147	VIP gene

Attribute	Value
Chromosome	4
Cytogenetic Band	4q12
Start Position	54,229,130
End Position	54,298,246
Strand	+ (forward)
Genomic Accession	NC_000004.12
Gene Span	~69.1 kb

Accession	Type	MANE Select	Chromosome
NM_006206	mRNA	✓ YES	4
NM_001347827	mRNA		4
NM_001347828	mRNA		4
NM_001347829	mRNA		4
NM_001347830	mRNA		4