|
|
Database: aplCal1 | Primary Table: xenoRefGene | Row Count: 246,163 | Data last updated: 2020-08-17
Format description: A gene prediction with some additional info. | On download server: MariaDB table dump directory
field | example | SQL type | info | description |
bin | 73 | smallint(5) unsigned | range | Indexing field to speed chromosome range queries. |
name | NM_032961 | varchar(255) | values | Name of gene (usually transcript_id from GTF) |
chrom | scaffold_182 | varchar(255) | values | Reference sequence chromosome or scaffold |
strand | + | char(1) | values | + or - for strand |
txStart | 96089 | int(10) unsigned | range | Transcription start position (or end position for minus strand item) |
txEnd | 283454 | int(10) unsigned | range | Transcription end position (or start position for minus strand item) |
cdsStart | 283454 | int(10) unsigned | range | Coding region start (or end position for minus strand item) |
cdsEnd | 283454 | int(10) unsigned | range | Coding region end (or start position for minus strand item) |
exonCount | 3 | int(10) unsigned | range | Number of exons |
exonStarts | 96089,168752,283427, | longblob | | Exon start positions (or end positions for minus strand item) |
exonEnds | 96115,168781,283454, | longblob | | Exon end positions (or start positions for minus strand item) |
score | 0 | int(11) | range | score |
name2 | PCDH10 | varchar(255) | values | Alternate name (e.g. gene_id from GTF) |
cdsStartStat | unk | enum('none', 'unk', 'incmpl', 'cmpl') | values | Status of CDS start annotation (none, unknown, incomplete, or complete) |
cdsEndStat | unk | enum('none', 'unk', 'incmpl', 'cmpl') | values | Status of CDS end annotation (none, unknown, incomplete, or complete) |
exonFrames | -1,-1,-1, | longblob | | Reading frame of the start of the CDS region of the exon, in the direction of transcription (0,1,2), or -1 if there is no CDS region. |
|
| |
|
|
Connected Tables and Joining Fields
|
|
aplCal1.all_est.qName (via xenoRefGene.name)
aplCal1.all_mrna.qName (via xenoRefGene.name)
aplCal1.xenoRefFlat.name (via xenoRefGene.name)
aplCal1.xenoRefSeqAli.qName (via xenoRefGene.name)
hgFixed.gbCdnaInfo.acc (via xenoRefGene.name)
hgFixed.gbMiscDiff.acc (via xenoRefGene.name)
hgFixed.gbSeq.acc (via xenoRefGene.name)
hgFixed.gbWarn.acc (via xenoRefGene.name)
hgFixed.imageClone.acc (via xenoRefGene.name)
| |
|
|
Sample Rows
|
|
bin | name | chrom | strand | txStart | txEnd | cdsStart | cdsEnd | exonCount | exonStarts | exonEnds | score | name2 | cdsStartStat | cdsEndStat | exonFrames |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
73 | NM_032961 | scaffold_182 | + | 96089 | 283454 | 283454 | 283454 | 3 | 96089,168752,283427, | 96115,168781,283454, | 0 | PCDH10 | unk | unk | -1,-1,-1, |
586 | NM_001107076 | scaffold_517 | + | 174560 | 188009 | 174560 | 188009 | 6 | 174560,184008,184620,184682,186270,187805, | 174662,184071,184622,184740,186348,188009, | 0 | Rab40b | incmpl | incmpl | 0,0,0,2,0,0, |
73 | NM_001256650 | scaffold_547 | + | 113102 | 157410 | 113102 | 157410 | 14 | 113102,113438,113746,113968,140247,140595,140848,140937,141021,155983,156072,156301,156424,157097, | 113153,113662,113800,114026,140382,140758,140904,140988,141184,156036,156133,156340,156473,157410, | 0 | ZNF43 | incmpl | incmpl | 0,0,2,2,0,0,1,0,0,1,0,1,1,2, |
588 | NM_001197230 | scaffold_3 | - | 394214 | 426252 | 394214 | 426252 | 19 | 394214,395312,398595,399126,401482,404154,406179,409503,410249,413999,415650,416095,417516,419273,419715,420268,420852,421935,42 ... | 394328,395336,398691,399171,401599,404226,406281,409761,410305,414138,415749,416189,417638,419350,419779,420391,421027,422024,42 ... | 0 | nat10 | cmpl | incmpl | 0,2,0,0,0,0,0,0,1,0,0,2,0,1,0,0,2,0,0, |
585 | NM_001104068 | scaffold_1346 | + | 21 | 16642 | 21 | 16642 | 6 | 21,3103,9428,14390,15975,16567, | 120,3202,9629,14621,16113,16642, | 0 | Ank2 | incmpl | incmpl | 0,0,0,0,0,0, |
585 | NM_001104068 | scaffold_2964 | + | 3325 | 15662 | 3325 | 15662 | 15 | 3325,3913,4684,5232,7759,9155,9720,10401,10942,11474,12362,13223,13996,14729,15596, | 3424,4005,4790,5391,7858,9254,9918,10500,11140,11672,12560,13409,14191,14743,15662, | 0 | Ank2 | incmpl | incmpl | 0,0,2,0,0,0,0,0,0,0,0,0,0,0,0, |
585 | NM_001170348 | scaffold_625 | + | 34081 | 37621 | 34081 | 37621 | 4 | 34081,36901,36949,37528, | 34237,36928,37024,37621, | 0 | Kif26a | incmpl | incmpl | 0,0,0,0, |
588 | NM_001136175 | scaffold_359 | - | 397035 | 408612 | 397035 | 408612 | 4 | 397035,397084,397288,408477, | 397059,397159,397399,408612, | 0 | LOC100191026 | incmpl | incmpl | 1,0,0,0, |
585 | NM_059748 | scaffold_2041 | - | 19193 | 24273 | 19193 | 24273 | 3 | 19193,21747,24201, | 19349,21873,24273, | 0 | bckd-1B | incmpl | incmpl | 0,0,0, |
587 | NM_059720 | scaffold_42 | + | 304175 | 306211 | 304175 | 306211 | 2 | 304175,306094, | 304218,306211, | 0 | prg-1 | incmpl | cmpl | 2,0, |
|
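Note: all start coordinates in our database are 0-based, not 1-based (end coordinates are unaffected, i.e. ranges are half-open).
See the explanation of the coordinate system in the UCSC Genome Browser FAQ (https://genome.ucsc.edu/FAQ/FAQtracks.html#tracks1).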
| |
|
|
|