|
|
Database: monDom4 Primary Table: xenoRefGene Row Count: 323,356   Data last updated: 2020-08-22
Format description: A gene prediction with some additional info. On download server: MariaDB table dump directory
field | example | SQL type | info | description |
---|---|---|---|---|
bin | 1429 | smallint(5) unsigned | range | Indexing field to speed chromosome range queries. |
name | NM_001042785 | varchar(255) | values | Name of gene (usually transcript_id from GTF) |
chrom | chrUn | varchar(255) | values | Reference sequence chromosome or scaffold |
strand | - | char(1) | values | + or - for strand |
txStart | 110723731 | int(10) unsigned | range | Transcription start position (or end position for minus strand item) |
txEnd | 110728644 | int(10) unsigned | range | Transcription end position (or start position for minus strand item) |
cdsStart | 110723731 | int(10) unsigned | range | Coding region start (or end position for minus strand item) |
cdsEnd | 110728644 | int(10) unsigned | range | Coding region end (or start position for minus strand item) |
exonCount | 4 | int(10) unsigned | range | Number of exons |
exonStarts | 110723731,110725299,1107275... | longblob | | Exon start positions (or end positions for minus strand item) |
exonEnds | 110723944,110725455,1107276... | longblob | | Exon end positions (or start positions for minus strand item) |
score | 0 | int(11) | range | score |
name2 | Ekar | varchar(255) | values | Alternate name (e.g. gene_id from GTF) |
cdsStartStat | incmpl | enum('none', 'unk', 'incmpl', 'cmpl') | values | Status of CDS start annotation (none, unknown, incomplete, or complete) |
cdsEndStat | incmpl | enum('none', 'unk', 'incmpl', 'cmpl') | values | Status of CDS end annotation (none, unknown, incomplete, or complete) |
exonFrames | 0,0,0,0, | longblob | | Reading frame of the start of the CDS region of the exon, in the direction of transcription (0,1,2), or -1 if there is no CDS region. |
|
| |
|
|
Connected Tables and Joining Fields
|
|
hgFixed.gbCdnaInfo.acc (via xenoRefGene.name)
hgFixed.gbMiscDiff.acc (via xenoRefGene.name)
hgFixed.gbSeq.acc (via xenoRefGene.name)
hgFixed.gbWarn.acc (via xenoRefGene.name)
hgFixed.imageClone.acc (via xenoRefGene.name)
monDom4.all_est.qName (via xenoRefGene.name)
monDom4.all_mrna.qName (via xenoRefGene.name)
monDom4.refGene.name (via xenoRefGene.name)
monDom4.refSeqAli.qName (via xenoRefGene.name)
monDom4.xenoMrna.qName (via xenoRefGene.name)
monDom4.xenoRefFlat.name (via xenoRefGene.name)
monDom4.xenoRefSeqAli.qName (via xenoRefGene.name)
| |
|
|
Sample Rows
|
|
bin | name | chrom | strand | txStart | txEnd | cdsStart | cdsEnd | exonCount | exonStarts | exonEnds | score | name2 | cdsStartStat | cdsEndStat | exonFrames |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
1429 | NM_001042785 | chrUn | - | 110723731 | 110728644 | 110723731 | 110728644 | 4 | 110723731,110725299,110727556,110728605, | 110723944,110725455,110727655,110728644, | 0 | Ekar | incmpl | incmpl | 0,0,0,0, |
4088 | NM_001080655 | chr3 | - | 459251986 | 459253266 | 459251986 | 459253266 | 5 | 459251986,459252197,459252445,459252672,459253200, | 459252103,459252278,459252596,459252812,459253266, | 0 | pnpla7a | incmpl | incmpl | 0,0,2,0,0, |
4039 | NM_001035422 | chr1 | + | 452777615 | 452778161 | 452777615 | 452778161 | 1 | 452777615, | 452778161, | 0 | RNF183 | incmpl | cmpl | 0, |
2723 | NM_001035421 | chr2 | + | 280351867 | 280352710 | 280352008 | 280352710 | 2 | 280351867,280352563, | 280352548,280352710, | 0 | KCTD11 | cmpl | cmpl | 0,0, |
2299 | NM_001035421 | chr7 | + | 224698771 | 224699614 | 224698912 | 224699614 | 2 | 224698771,224699467, | 224699452,224699614, | 0 | KCTD11 | cmpl | cmpl | 0,0, |
4054 | NM_001035420 | chr3 | - | 454745119 | 454765080 | 454745119 | 454765080 | 7 | 454745119,454747467,454748808,454750712,454751078,454751764,454765017, | 454745315,454747610,454748930,454750845,454751144,454751887,454765080, | 0 | CNN2 | cmpl | incmpl | 2,0,1,0,0,0,0, |
2830 | NR_129499 | chr8 | + | 294272578 | 294272638 | 294272638 | 294272638 | 1 | 294272578, | 294272638, | 0 | MIR148A | unk | unk | -1, |
2042 | NM_001163489 | chr2 | + | 191008467 | 191039583 | 191030763 | 191038626 | 13 | 191008467,191030763,191031244,191033022,191033362,191033619,191034446,191035335,191036566,191036853,191038129,191038467,19103955 ... | 191008495,191030862,191031348,191033139,191033488,191033792,191034597,191035517,191036684,191036988,191038262,191038626,19103958 ... | 0 | Sema4a | incmpl | incmpl | -1,0,0,2,0,0,2,0,2,0,1,0,-1, |
4443 | NM_001193351 | chr2 | - | 505718692 | 505718809 | 505718692 | 505718809 | 1 | 505718692, | 505718809, | 0 | LYRM9 | cmpl | incmpl | 0, |
622 | NM_194298 | chr1 | + | 4855433 | 4880515 | 4855452 | 4878643 | 8 | 4855433,4863035,4867906,4874582,4874774,4874927,4878541,4880476, | 4855648,4863171,4868012,4874747,4874788,4875398,4878643,4880515, | 0 | SLC16A9 | cmpl | incmpl | 0,1,2,0,0,0,0,-1, |
|
Note: all start coordinates in our database are 0-based, not 1-based. See the explanation of the coordinate system in the UCSC Genome Browser FAQ.
| |
|
|
|