               SEQUENCE LISTING

<110> Angewandte Biotechnologie GmbH

<120> Pluripotent tendon and ligament perivascular cells

<130> S3254 PCT S3

<150> EP11 17 4762.2
<151> 2011-07-20

<160> 118

<170> BiSSAP 1.0

<210> 1
<211> 22
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..22
<223> /mol_type="DNA"
      /note="human sense primer hOct4"
      /organism="artificial sequences"

<400> 1
acctggctaa gcttccaagg cc                                             22


<210> 2
<211> 22
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..22
<223> /mol_type="DNA"
      /note="human antisense primer hOct4"
      /organism="artificial sequences"

<400> 2
tcgtttggct gaataccttc cc                                             22


<210> 3
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="human sense primer Sox2"
      /organism="artificial sequences"

<400> 3
aagatgcaca actcggagat c                                              21


<210> 4
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="human antisense primer Sox2"
      /organism="artificial sequences"

<400> 4
tatttataat ccgggtgctc c                                              21


<210> 5
<211> 22
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..22
<223> /mol_type="DNA"
      /note="human sense primer hNanog"
      /organism="artificial sequences"

<400> 5
tcaggacagc cctgattctt cc                                             22


<210> 6
<211> 18
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..18
<223> /mol_type="DNA"
      /note="human antisense primer hNanog"
      /organism="artificial sequences"

<400> 6
tcttgcatct gctggagg                                                  18


<210> 7
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="human sense primer Klf-4"
      /organism="artificial sequences"

<400> 7
agaccgagga gttcaacgat c                                              21


<210> 8
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="human antisense primer Klf-4"
      /organism="artificial sequences"

<400> 8
ttgatgtccg ccaggttgaa g                                              21


<210> 9
<211> 20
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..20
<223> /mol_type="DNA"
      /note="human sense primer cMyc"
      /organism="artificial sequences"

<400> 9
acaggaacta tgacctcgac                                                20


<210> 10
<211> 20
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..20
<223> /mol_type="DNA"
      /note="human antisense primer cMyc"
      /organism="artificial sequences"

<400> 10
tacagtcctg gatgatgatg                                                20


<210> 11
<211> 23
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..23
<223> /mol_type="DNA"
      /note="human sense primer hNestin"
      /organism="artificial sequences"

<400> 11
tctgaggaag tggggcaagg aat                                            23


<210> 12
<211> 24
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..24
<223> /mol_type="DNA"
      /note="human antisense primer hNestin"
      /organism="artificial sequences"

<400> 12
ttaagagtgc tgctcctgag cagg                                           24


<210> 13
<211> 22
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..22
<223> /mol_type="DNA"
      /note="human sense primer Col1A1"
      /organism="artificial sequences"

<400> 13
tcacctacca ctgcaagaac ag                                             22


<210> 14
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="human antisense primer Col1A1"
      /organism="artificial sequences"

<400> 14
atggagggag tttacaggaa g                                              21


<210> 15
<211> 19
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..19
<223> /mol_type="DNA"
      /note="human sense primer Col3A1"
      /organism="artificial sequences"

<400> 15
agtgccaatc ctttgaatg                                                 19


<210> 16
<211> 20
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..20
<223> /mol_type="DNA"
      /note="human antisense primer Col3A1"
      /organism="artificial sequences"

<400> 16
tatgtgatgt tctgggaagc                                                20


<210> 17
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="human sense primer hGalc"
      /organism="artificial sequences"

<400> 17
tggatcttac agggttacag g                                              21


<210> 18
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="human antisense primer Galc"
      /organism="artificial sequences"

<400> 18
acacaccagg taatgttaaa g                                              21


<210> 19
<211> 23
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..23
<223> /mol_type="DNA"
      /note="human sense primer hSCX"
      /organism="artificial sequences"

<400> 19
tgcgcctggc ctccagctac atc                                            23


<210> 20
<211> 23
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..23
<223> /mol_type="DNA"
      /note="human antisense primer hSCX"
      /organism="artificial sequences"

<400> 20
gttgctgagg cagaaggtgc aga                                            23


<210> 21
<211> 24
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..24
<223> /mol_type="DNA"
      /note="human sense primer hSOX9"
      /organism="artificial sequences"

<400> 21
tcagcccact gacagacctt aatc                                           24


<210> 22
<211> 23
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..23
<223> /mol_type="DNA"
      /note="human antisense primer hSOX9"
      /organism="artificial sequences"

<400> 22
aggtttgggg ctgggaggga aac                                            23


<210> 23
<211> 22
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..22
<223> /mol_type="DNA"
      /note="human sense primer INS1"
      /organism="artificial sequences"

<400> 23
tcatagacca tcagcaagca gg                                             22


<210> 24
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="human antisense primer INS1"
      /organism="artificial sequences"

<400> 24
tggtggactc agttgcagta g                                              21


<210> 25
<211> 20
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..20
<223> /mol_type="DNA"
      /note="rat sense primer ratOct4"
      /organism="artificial sequences"

<400> 25
tggctaagct tccaggggcc                                                20


<210> 26
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="rat antisense primer ratOct4"
      /organism="artificial sequences"

<400> 26
atggttgtct ggctgaacac c                                              21


<210> 27
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="rat sense primer Sox2"
      /organism="artificial sequences"

<400> 27
aagatgcaca actcggagat c                                              21


<210> 28
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="rat antisense primer Sox2"
      /organism="artificial sequences"

<400> 28
tatttataat ccgggtgctc c                                              21


<210> 29
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="rat sense primer ratNanog"
      /organism="artificial sequences"

<400> 29
tcaagatagc cctgattctt c                                              21


<210> 30
<211> 18
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..18
<223> /mol_type="DNA"
      /note="rat antisense primer ratNanog"
      /organism="artificial sequences"

<400> 30
tcttgcatct gctggagg                                                  18


<210> 31
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="rat sense primer Klf-4"
      /organism="artificial sequences"

<400> 31
agaccgagga gttcaacgat c                                              21


<210> 32
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="rat antisense primer Klf-4"
      /organism="artificial sequences"

<400> 32
ttgatgtccg ccaggttgaa g                                              21


<210> 33
<211> 20
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..20
<223> /mol_type="DNA"
      /note="rat sense primer cMyc"
      /organism="artificial sequences"

<400> 33
acaggaacta tgacctcgac                                                20


<210> 34
<211> 20
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..20
<223> /mol_type="DNA"
      /note="rat antisense primer cMyc"
      /organism="artificial sequences"

<400> 34
tacagtcctg gatgatgatg                                                20


<210> 35
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="rat sense primer rat_Nestin"
      /organism="artificial sequences"

<400> 35
tgctgatgag gaagaaagtg g                                              21


<210> 36
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="rat antisense primer rat_Nestin"
      /organism="artificial sequences"

<400> 36
accaatgtca aaggcatctc c                                              21


<210> 37
<211> 22
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..22
<223> /mol_type="DNA"
      /note="rat sense primer Col1A1"
      /organism="artificial sequences"

<400> 37
tcacctacca ctgcaagaac ag                                             22


<210> 38
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="rat antisense primer Col1A1"
      /organism="artificial sequences"

<400> 38
atggagggag tttacaggaa g                                              21


<210> 39
<211> 19
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..19
<223> /mol_type="DNA"
      /note="rat sense primer Col3A1"
      /organism="artificial sequences"

<400> 39
agtgccaatc ctttgaatg                                                 19


<210> 40
<211> 20
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..20
<223> /mol_type="DNA"
      /note="rat antisense primer Col3A1"
      /organism="artificial sequences"

<400> 40
tatgtgatgt tctgggaagc                                                20


<210> 41
<211> 22
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..22
<223> /mol_type="DNA"
      /note="rat sense primer ratGalc"
      /organism="artificial sequences"

<400> 41
tgttcacact caccactctg ac                                             22


<210> 42
<211> 22
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..22
<223> /mol_type="DNA"
      /note="rat antisense primer ratGalc"
      /organism="artificial sequences"

<400> 42
aggtcggctg taactctgta ag                                             22


<210> 43
<211> 23
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..23
<223> /mol_type="DNA"
      /note="rat sense primer SCX"
      /organism="artificial sequences"

<400> 43
tgcgcctggc ctccagctac atc                                            23


<210> 44
<211> 23
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..23
<223> /mol_type="DNA"
      /note="rat antisense primer SCX"
      /organism="artificial sequences"

<400> 44
gttgctgagg cagaaggtgc aga                                            23


<210> 45
<211> 24
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..24
<223> /mol_type="DNA"
      /note="rat sense primer SOX9"
      /organism="artificial sequences"

<400> 45
tcagcccact gacagacctt aatc                                           24


<210> 46
<211> 23
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..23
<223> /mol_type="DNA"
      /note="rat antisense primer SOX9"
      /organism="artificial sequences"

<400> 46
aggtttgggg ctgggaggga aac                                            23


<210> 47
<211> 22
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..22
<223> /mol_type="DNA"
      /note="rat sense primer INS1"
      /organism="artificial sequences"

<400> 47
tcatagacca tcagcaagca gg                                             22


<210> 48
<211> 21
<212> DNA
<213> artificial sequences

<220> 
<221> source
<222> 1..21
<223> /mol_type="DNA"
      /note="rat antisense primer INS1"
      /organism="artificial sequences"

<400> 48
tggtggactc agttgcagta g                                              21


<210> 49
<211> 5591
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..5591
<223> /mol_type="DNA"
      /note="Homo sapiens Nestin"
      /organism="Homo sapiens"

<400> 49
gctactccca ccccgccccg ccccgtcatt gtccccgtcg gtctcttttc tcttccgtcc       60

taaaagctct gcgagccgct cccttctccc ggtgccccgc gtctgtccat cctcagtggg      120

tcagacgagc aggatggagg gctgcatggg ggaggagtcg tttcagatgt gggagctcaa      180

tcggcgcctg gaggcctacc tggcccgggt caaggcgctg gaggagcaga atgagctgct      240

cagcgcggag ctcggggggc tccgggcaca atccgcggac acctcctggc gggcgcatgc      300

cgacgacgag ctggcggccc tgcgggccct cgttgaccaa cgctggcggg agaagcacgc      360

ggccgaggtg gcgcgcgaca acctggctga agagctggag ggcgtggcag gccgatgcca      420

gcagctgcgg ctggcccggg agcggacgac ggaggaggta gcccgcaacc ggcgcgccgt      480

cgaggcagag aaatgcgccc gggcctggct gagtagccag gtggcagagc tggagcgcga      540

gctagaggct ctacgcgtgg cgcacgagga ggagcgcgtc ggcctgaacg cgcaggctgc      600

ctgtgccccc cgctgccccg cgccgccccg cgggcctccc gcgccggccc cggaggtaga      660

ggagctggca aggcgactgg gcgaggcgtg gcgcggggca gtgcgcggct accaggagcg      720

cgtggcacac atggagacgt cgctgggcca ggcccgcgag cggctgggcc gggcggtgca      780

gggtgcccgc gagggccgcc tggagctgca gcagctccag gctgagcgcg gaggcctcct      840

ggagcgcagg gcagcgttgg aacagaggtt ggagggccgc tggcaggagc ggctgcgggc      900

tactgaaaag ttccagctgg ctgtggaggc cctggagcag gagaaacagg gcctacagag      960

ccagatcgct caggtcctgg aaggtcggca gcagctggcg cacctcaaga tgtccctcag     1020

cctggaggtg gccacgtaca ggaccctcct ggaggctgag aactcccggc tgcaaacacc     1080

tggcggtggc tccaagactt ccctcagctt tcaggacccc aagctggagc tgcaattccc     1140

taggacccca gagggccggc gtcttggatc tttgctccca gtcctgagcc caacttccct     1200

cccctcaccc ttgcctgcta cccttgagac acctgtgcca gcctttctta agaaccaaga     1260

attcctccag gcccgtaccc ctaccttggc cagcaccccc atccccccca cacctcaggc     1320

accctctcct gctgtagatg cagagatcag agcccaggat gctcctctct ctctgctcca     1380

gacacagggt gggaggaaac aggctccaga gcccctgcgg gctgaagcca gggtggccat     1440

tcctgccagc gtcctgcctg gaccagagga gcctgggggc cagcggcaag aggccagtac     1500

aggccagtcc ccagaggacc atgcctcctt ggcaccaccc ctcagccctg accactccag     1560

tttagaggct aaggatggag aatccggtgg gtctagagtg ttcagcatat gccgagggga     1620

aggtgaaggg caaatctggg ggttggtaga gaaagaaaca gccatagagg gcaaagtggt     1680

aagcagcttg cagcaggaaa tatgggaaga agaggatcta aacaggaagg aaatccagga     1740

ctcccaggtt cctttggaaa aagaaaccct gaagtctctg ggagaggaga ttcaagagtc     1800

actgaagact ctggaaaacc agagccatga gacactagaa agggagaatc aagaatgtcc     1860

gaggtcttta gaagaagact tagaaacact aaaaagtcta gaaaaggaaa ataaagagct     1920

attaaaggat gtggaggtag tgagacctct agaaaaagag gctgtaggcc aacttaagcc     1980

tacaggaaaa gaggacacac agacattgca atccctgcaa aaggagaatc aagaactaat     2040

gaaatctctt gaaggtaatc tagagacatt tttatttcca ggaacggaaa atcaagaatt     2100

agtaagttct ctgcaagaga acttagagtc attgacagct ctggaaaagg agaatcaaga     2160

gccactgaga tctccagaag taggggatga ggaggcactg agacctctga caaaggagaa     2220

tcaggaaccc ctgaggtctc ttgaagatga gaacaaagag gcctttagat ctctagaaaa     2280

agagaaccag gagccactga agactctaga agaagaggac cagagtattg tgagacctct     2340

agaaacagag aatcacaaat cactgaggtc tttagaagaa caggaccaag agacattgag     2400

aactcttgaa aaagagactc aacagcgacg gaggtctcta ggggaacagg atcagatgac     2460

attaagaccc ccagaaaaag tggatctaga accactgaag tctcttgacc aggagatagc     2520

tagacctctt gaaaatgaga atcaagagtt cttaaagtca ctcaaagaag agagcgtaga     2580

ggcagtaaaa tctttagaaa cagagatcct agaatcactg aagtctgcgg gacaagagaa     2640

cctggaaaca ctgaaatctc cagaaactca agcaccactg tggactccag aagaaataaa     2700

tcagggggca atgaatcctc tagaaaagga aattcaagaa ccactggagt ctgtggaagt     2760

gaaccaagag acattcagac tcctggaaga ggagaatcag gaatcattga gatctctggg     2820

agcatggaac ctggagaatt tgagatctcc agaggaggta gacaaggaaa gtcaaaggaa     2880

tctggaagag gaagagaacc tgggaaaggg agagtaccaa gagtcactga ggtctctgga     2940

ggaggaggga caggagctgc cgcagtctgc agatgtgcag aggtgggaag atacggtgga     3000

gaaggaccaa gaactggctc aggaaagccc tcctgggatg gctggagtgg aaaatgagga     3060

tgaggcagag ctgaatctga gggagcagga tggcttcact gggaaggagg aggtggtaga     3120

gcagggagag ctgaatgcca cagaggaggt ctggatccca ggcgaggggc acccagagag     3180

ccctgagccc aaagagcaga gaggcctggt tgagggagcc agtgtgaagg gaggggctga     3240

gggcctccag gaccctgaag ggcaatcaca acaggtgggg gccccaggcc tccaggctcc     3300

ccaggggctg ccagaggcga tagagcccct ggtggaagat gatgtggccc cagggggtga     3360

ccaagcctcc ccagaggtca tgttggggtc agagcctgcc atgggtgagt ctgctgcggg     3420

agctgagcca ggcccggggc agggggtggg agggctgggg gacccaggcc atctgaccag     3480

ggaagaggtg atggaaccac ccctggaaga ggagagtttg gaggcaaaga gggttcaggg     3540

cttggaaggg cctagaaagg acctagagga ggcaggtggt ctggggacag agttctccga     3600

gctgcctggg aagagcagag acccttggga gcctcccagg gagggtaggg aggagtcaga     3660

ggctgaggcc cccaggggag cagaggaggc gttccctgct gagaccctgg gccacactgg     3720

aagtgatgcc ccttcacctt ggcctctggg gtcagaggaa gctgaggagg atgtaccacc     3780

agtgctggtc tcccccagcc caacgtacac cccgatcctg gaagatgccc ctgggcctca     3840

gcctcaggct gaagggagtc aggaggctag ctggggggtg caggggaggg ctgaagccct     3900

ggggaaagta gagagcgagc aggaggagtt gggttctggg gagatccccg agggccccca     3960

ggaggaaggg gaggagagca gagaagagag cgaggaggat gagctcgggg agacccttcc     4020

agactccact cccctgggct tctacctcag gtcccccacc tcccccaggt gggaccccac     4080

tggagagcag aggccacccc ctcaagggga gactggaaag gagggctggg atcctgctgt     4140

cctggcttcc gagggccttg aggccccacc ctcagaaaag gaggaggggg aggagggaga     4200

agaggagtgt ggccgtgact ctgacctgtc agaagaattt gaggacctgg ggactgaggc     4260

accttttctt cctggggtcc ctggggaggt ggcagaacct ctgggccagg tgccccagct     4320

gctactggat cctgcagcct gggatcgaga tggggagtcc gatgggtttg cagatgagga     4380

agaaagtggg gaggagggag aggaggatca ggaggagggg agggagccag gggctgggcg     4440

gtgggggcca gggtcttctg ttggcagcct ccaggccctg agtagctccc agagagggga     4500

attcctggag tctgattctg tgagtgtcag tgtcccctgg gatgacagct tgaggggtgc     4560

agtggctggt gcccccaaga ctgccctgga aacggagtcc caggacagtg ctgagccttc     4620

tggctcagag gaagagtctg accctgtttc cttggagagg gaggacaaag tccctggccc     4680

tctagagatc cccagtggga tggaggatgc aggcccaggg gcagacatca ttggtgttaa     4740

tggccagggt cccaacttgg aggggaagtc acagcatgtg aatgggggag tgatgaacgg     4800

gctggagcag tctgaggaag tggggcaagg aatgccgcta gtctctgagg gagaccgagg     4860

gagccccttt caggaggagg aggggagtgc tctgaagacc tcttgggcag gggctcctgt     4920

tcacctgggc cagggtcagt tcctgaagtt cactcagagg gaaggagata gagagtcctg     4980

gtcctcaggg gaggactagg aaaagaccat ctgcccggca ctggggactt aggggtgcgg     5040

ggaggggaag gacgcctcca agcccgctcc ctgctcagga gcagcactct taacttacga     5100

tctcttgaca tatggtttct ggctgagagg cctggcccgc taaggtgaaa aggggtgtgg     5160

caaaggagcc tactccaaga atggaggctg taggaatata acctcccacc ctgcaaaggg     5220

aatctcttgc ctgctccatc tcataggcta agtcagctga atcccgatag tactaggtcc     5280

ccttccctcc gcatcccgtc agctggaaaa ggcctgtggc ccagaggctt ctccaaaggg     5340

agggtgacat gctggctttt gtgcccaagc tcaccagccc tgcgccacct cactgcagta     5400

gtgcaccatc tcactgcagt agcacgccct cctgggccgt ctggcctgtg gctaatggag     5460

gtgacggcac tcccatgtgc tgactccccc catccctgcc acgctgtggc cctgcctggc     5520

tagtccctgc ctgaataaag taatgcctcc gcttcaaaaa aaaaaaaaaa aaaaaaaaaa     5580

aaaaaaaaaa a                                                          5591


<210> 50
<211> 1621
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..1621
<223> /mol_type="protein"
      /note="Homo sapiens Nestin"
      /organism="Homo sapiens"

<400> 50
Met Glu Gly Cys Met Gly Glu Glu Ser Phe Gln Met Trp Glu Leu Asn 
1               5                   10                   15    
Arg Arg Leu Glu Ala Tyr Leu Ala Arg Val Lys Ala Leu Glu Glu Gln 
            20                   25                  30        
Asn Glu Leu Leu Ser Ala Glu Leu Gly Gly Leu Arg Ala Gln Ser Ala 
        35                   40                  45            
Asp Thr Ser Trp Arg Ala His Ala Asp Asp Glu Leu Ala Ala Leu Arg 
    50                   55                  60                
Ala Leu Val Asp Gln Arg Trp Arg Glu Lys His Ala Ala Glu Val Ala 
65                   70                  75                  80
Arg Asp Asn Leu Ala Glu Glu Leu Glu Gly Val Ala Gly Arg Cys Gln 
                85                   90                  95    
Gln Leu Arg Leu Ala Arg Glu Arg Thr Thr Glu Glu Val Ala Arg Asn 
            100                  105                110        
Arg Arg Ala Val Glu Ala Glu Lys Cys Ala Arg Ala Trp Leu Ser Ser 
        115                  120                125            
Gln Val Ala Glu Leu Glu Arg Glu Leu Glu Ala Leu Arg Val Ala His 
    130                  135                140                
Glu Glu Glu Arg Val Gly Leu Asn Ala Gln Ala Ala Cys Ala Pro Arg 
145                  150                155                  160
Cys Pro Ala Pro Pro Arg Gly Pro Pro Ala Pro Ala Pro Glu Val Glu 
                165                  170                175    
Glu Leu Ala Arg Arg Leu Gly Glu Ala Trp Arg Gly Ala Val Arg Gly 
            180                  185                190        
Tyr Gln Glu Arg Val Ala His Met Glu Thr Ser Leu Gly Gln Ala Arg 
        195                  200                205            
Glu Arg Leu Gly Arg Ala Val Gln Gly Ala Arg Glu Gly Arg Leu Glu 
    210                  215                220                
Leu Gln Gln Leu Gln Ala Glu Arg Gly Gly Leu Leu Glu Arg Arg Ala 
225                  230                235                  240
Ala Leu Glu Gln Arg Leu Glu Gly Arg Trp Gln Glu Arg Leu Arg Ala 
                245                  250                255    
Thr Glu Lys Phe Gln Leu Ala Val Glu Ala Leu Glu Gln Glu Lys Gln 
            260                  265                270        
Gly Leu Gln Ser Gln Ile Ala Gln Val Leu Glu Gly Arg Gln Gln Leu 
        275                  280                285            
Ala His Leu Lys Met Ser Leu Ser Leu Glu Val Ala Thr Tyr Arg Thr 
    290                  295                300                
Leu Leu Glu Ala Glu Asn Ser Arg Leu Gln Thr Pro Gly Gly Gly Ser 
305                  310                315                  320
Lys Thr Ser Leu Ser Phe Gln Asp Pro Lys Leu Glu Leu Gln Phe Pro 
                325                  330                335    
Arg Thr Pro Glu Gly Arg Arg Leu Gly Ser Leu Leu Pro Val Leu Ser 
            340                  345                350        
Pro Thr Ser Leu Pro Ser Pro Leu Pro Ala Thr Leu Glu Thr Pro Val 
        355                  360                365            
Pro Ala Phe Leu Lys Asn Gln Glu Phe Leu Gln Ala Arg Thr Pro Thr 
    370                  375                380                
Leu Ala Ser Thr Pro Ile Pro Pro Thr Pro Gln Ala Pro Ser Pro Ala 
385                  390                395                  400
Val Asp Ala Glu Ile Arg Ala Gln Asp Ala Pro Leu Ser Leu Leu Gln 
                405                  410                415    
Thr Gln Gly Gly Arg Lys Gln Ala Pro Glu Pro Leu Arg Ala Glu Ala 
            420                  425                430        
Arg Val Ala Ile Pro Ala Ser Val Leu Pro Gly Pro Glu Glu Pro Gly 
        435                  440                445            
Gly Gln Arg Gln Glu Ala Ser Thr Gly Gln Ser Pro Glu Asp His Ala 
    450                  455                460                
Ser Leu Ala Pro Pro Leu Ser Pro Asp His Ser Ser Leu Glu Ala Lys 
465                  470                475                  480
Asp Gly Glu Ser Gly Gly Ser Arg Val Phe Ser Ile Cys Arg Gly Glu 
                485                  490                495    
Gly Glu Gly Gln Ile Trp Gly Leu Val Glu Lys Glu Thr Ala Ile Glu 
            500                  505                510        
Gly Lys Val Val Ser Ser Leu Gln Gln Glu Ile Trp Glu Glu Glu Asp 
        515                  520                525            
Leu Asn Arg Lys Glu Ile Gln Asp Ser Gln Val Pro Leu Glu Lys Glu 
    530                  535                540                
Thr Leu Lys Ser Leu Gly Glu Glu Ile Gln Glu Ser Leu Lys Thr Leu 
545                  550                555                  560
Glu Asn Gln Ser His Glu Thr Leu Glu Arg Glu Asn Gln Glu Cys Pro 
                565                  570                575    
Arg Ser Leu Glu Glu Asp Leu Glu Thr Leu Lys Ser Leu Glu Lys Glu 
            580                  585                590        
Asn Lys Glu Leu Leu Lys Asp Val Glu Val Val Arg Pro Leu Glu Lys 
        595                  600                605            
Glu Ala Val Gly Gln Leu Lys Pro Thr Gly Lys Glu Asp Thr Gln Thr 
    610                  615                620                
Leu Gln Ser Leu Gln Lys Glu Asn Gln Glu Leu Met Lys Ser Leu Glu 
625                  630                635                  640
Gly Asn Leu Glu Thr Phe Leu Phe Pro Gly Thr Glu Asn Gln Glu Leu 
                645                  650                655    
Val Ser Ser Leu Gln Glu Asn Leu Glu Ser Leu Thr Ala Leu Glu Lys 
            660                  665                670        
Glu Asn Gln Glu Pro Leu Arg Ser Pro Glu Val Gly Asp Glu Glu Ala 
        675                  680                685            
Leu Arg Pro Leu Thr Lys Glu Asn Gln Glu Pro Leu Arg Ser Leu Glu 
    690                  695                700                
Asp Glu Asn Lys Glu Ala Phe Arg Ser Leu Glu Lys Glu Asn Gln Glu 
705                  710                715                  720
Pro Leu Lys Thr Leu Glu Glu Glu Asp Gln Ser Ile Val Arg Pro Leu 
                725                  730                735    
Glu Thr Glu Asn His Lys Ser Leu Arg Ser Leu Glu Glu Gln Asp Gln 
            740                  745                750        
Glu Thr Leu Arg Thr Leu Glu Lys Glu Thr Gln Gln Arg Arg Arg Ser 
        755                  760                765            
Leu Gly Glu Gln Asp Gln Met Thr Leu Arg Pro Pro Glu Lys Val Asp 
    770                  775                780                
Leu Glu Pro Leu Lys Ser Leu Asp Gln Glu Ile Ala Arg Pro Leu Glu 
785                  790                795                  800
Asn Glu Asn Gln Glu Phe Leu Lys Ser Leu Lys Glu Glu Ser Val Glu 
                805                  810                815    
Ala Val Lys Ser Leu Glu Thr Glu Ile Leu Glu Ser Leu Lys Ser Ala 
            820                  825                830        
Gly Gln Glu Asn Leu Glu Thr Leu Lys Ser Pro Glu Thr Gln Ala Pro 
        835                  840                845            
Leu Trp Thr Pro Glu Glu Ile Asn Gln Gly Ala Met Asn Pro Leu Glu 
    850                  855                860                
Lys Glu Ile Gln Glu Pro Leu Glu Ser Val Glu Val Asn Gln Glu Thr 
865                  870                875                  880
Phe Arg Leu Leu Glu Glu Glu Asn Gln Glu Ser Leu Arg Ser Leu Gly 
                885                  890                895    
Ala Trp Asn Leu Glu Asn Leu Arg Ser Pro Glu Glu Val Asp Lys Glu 
            900                  905                910        
Ser Gln Arg Asn Leu Glu Glu Glu Glu Asn Leu Gly Lys Gly Glu Tyr 
        915                  920                925            
Gln Glu Ser Leu Arg Ser Leu Glu Glu Glu Gly Gln Glu Leu Pro Gln 
    930                  935                940                
Ser Ala Asp Val Gln Arg Trp Glu Asp Thr Val Glu Lys Asp Gln Glu 
945                  950                955                  960
Leu Ala Gln Glu Ser Pro Pro Gly Met Ala Gly Val Glu Asn Glu Asp 
                965                  970                975    
Glu Ala Glu Leu Asn Leu Arg Glu Gln Asp Gly Phe Thr Gly Lys Glu 
            980                  985                990        
Glu Val Val Glu Gln Gly Glu Leu Asn Ala Thr Glu Glu Val Trp Ile 
        995                  1000                1005            
Pro Gly Glu Gly His Pro Glu Ser Pro Glu Pro Lys Glu Gln Arg Gly 
    1010                1015                1020                
Leu Val Glu Gly Ala Ser Val Lys Gly Gly Ala Glu Gly Leu Gln Asp 
1025                1030                1035                1040
Pro Glu Gly Gln Ser Gln Gln Val Gly Ala Pro Gly Leu Gln Ala Pro 
                1045                1050                1055    
Gln Gly Leu Pro Glu Ala Ile Glu Pro Leu Val Glu Asp Asp Val Ala 
            1060                1065                1070        
Pro Gly Gly Asp Gln Ala Ser Pro Glu Val Met Leu Gly Ser Glu Pro 
        1075                1080                1085            
Ala Met Gly Glu Ser Ala Ala Gly Ala Glu Pro Gly Pro Gly Gln Gly 
    1090                1095                1100                
Val Gly Gly Leu Gly Asp Pro Gly His Leu Thr Arg Glu Glu Val Met 
1105                1110                1115                1120
Glu Pro Pro Leu Glu Glu Glu Ser Leu Glu Ala Lys Arg Val Gln Gly 
                1125                1130                1135    
Leu Glu Gly Pro Arg Lys Asp Leu Glu Glu Ala Gly Gly Leu Gly Thr 
            1140                1145                1150        
Glu Phe Ser Glu Leu Pro Gly Lys Ser Arg Asp Pro Trp Glu Pro Pro 
        1155                1160                1165            
Arg Glu Gly Arg Glu Glu Ser Glu Ala Glu Ala Pro Arg Gly Ala Glu 
    1170                1175                1180                
Glu Ala Phe Pro Ala Glu Thr Leu Gly His Thr Gly Ser Asp Ala Pro 
1185                1190                1195                1200
Ser Pro Trp Pro Leu Gly Ser Glu Glu Ala Glu Glu Asp Val Pro Pro 
                1205                1210                1215    
Val Leu Val Ser Pro Ser Pro Thr Tyr Thr Pro Ile Leu Glu Asp Ala 
            1220                1225                1230        
Pro Gly Pro Gln Pro Gln Ala Glu Gly Ser Gln Glu Ala Ser Trp Gly 
        1235                1240                1245            
Val Gln Gly Arg Ala Glu Ala Leu Gly Lys Val Glu Ser Glu Gln Glu 
    1250                1255                1260                
Glu Leu Gly Ser Gly Glu Ile Pro Glu Gly Pro Gln Glu Glu Gly Glu 
1265                1270                1275                1280
Glu Ser Arg Glu Glu Ser Glu Glu Asp Glu Leu Gly Glu Thr Leu Pro 
                1285                1290                1295    
Asp Ser Thr Pro Leu Gly Phe Tyr Leu Arg Ser Pro Thr Ser Pro Arg 
            1300                1305                1310        
Trp Asp Pro Thr Gly Glu Gln Arg Pro Pro Pro Gln Gly Glu Thr Gly 
        1315                1320                1325            
Lys Glu Gly Trp Asp Pro Ala Val Leu Ala Ser Glu Gly Leu Glu Ala 
    1330                1335                1340                
Pro Pro Ser Glu Lys Glu Glu Gly Glu Glu Gly Glu Glu Glu Cys Gly 
1345                1350                1355                1360
Arg Asp Ser Asp Leu Ser Glu Glu Phe Glu Asp Leu Gly Thr Glu Ala 
                1365                1370                1375    
Pro Phe Leu Pro Gly Val Pro Gly Glu Val Ala Glu Pro Leu Gly Gln 
            1380                1385                1390        
Val Pro Gln Leu Leu Leu Asp Pro Ala Ala Trp Asp Arg Asp Gly Glu 
        1395                1400                1405            
Ser Asp Gly Phe Ala Asp Glu Glu Glu Ser Gly Glu Glu Gly Glu Glu 
    1410                1415                1420                
Asp Gln Glu Glu Gly Arg Glu Pro Gly Ala Gly Arg Trp Gly Pro Gly 
1425                1430                1435                1440
Ser Ser Val Gly Ser Leu Gln Ala Leu Ser Ser Ser Gln Arg Gly Glu 
                1445                1450                1455    
Phe Leu Glu Ser Asp Ser Val Ser Val Ser Val Pro Trp Asp Asp Ser 
            1460                1465                1470        
Leu Arg Gly Ala Val Ala Gly Ala Pro Lys Thr Ala Leu Glu Thr Glu 
        1475                1480                1485            
Ser Gln Asp Ser Ala Glu Pro Ser Gly Ser Glu Glu Glu Ser Asp Pro 
    1490                1495                1500                
Val Ser Leu Glu Arg Glu Asp Lys Val Pro Gly Pro Leu Glu Ile Pro 
1505                1510                1515                1520
Ser Gly Met Glu Asp Ala Gly Pro Gly Ala Asp Ile Ile Gly Val Asn 
                1525                1530                1535    
Gly Gln Gly Pro Asn Leu Glu Gly Lys Ser Gln His Val Asn Gly Gly 
            1540                1545                1550        
Val Met Asn Gly Leu Glu Gln Ser Glu Glu Val Gly Gln Gly Met Pro 
        1555                1560                1565            
Leu Val Ser Glu Gly Asp Arg Gly Ser Pro Phe Gln Glu Glu Glu Gly 
    1570                1575                1580                
Ser Ala Leu Lys Thr Ser Trp Ala Gly Ala Pro Val His Leu Gly Gln 
1585                1590                1595                1600
Gly Gln Phe Leu Lys Phe Thr Gln Arg Glu Gly Asp Arg Glu Ser Trp 
                1605                1610                1615    
Ser Ser Gly Glu Asp 
            1620    

<210> 51
<211> 5927
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..5927
<223> /mol_type="DNA"
      /note="Homo sapiens Col1A1"
      /organism="Homo sapiens"

<400> 51
tcgtcggagc agacgggagt ttctcctcgg ggtcggagca ggaggcacgc ggagtgtgag       60

gccacgcatg agcggacgct aaccccctcc ccagccacaa agagtctaca tgtctagggt      120

ctagacatgt tcagctttgt ggacctccgg ctcctgctcc tcttagcggc caccgccctc      180

ctgacgcacg gccaagagga aggccaagtc gagggccaag acgaagacat cccaccaatc      240

acctgcgtac agaacggcct caggtaccat gaccgagacg tgtggaaacc cgagccctgc      300

cggatctgcg tctgcgacaa cggcaaggtg ttgtgcgatg acgtgatctg tgacgagacc      360

aagaactgcc ccggcgccga agtccccgag ggcgagtgct gtcccgtctg ccccgacggc      420

tcagagtcac ccaccgacca agaaaccacc ggcgtcgagg gacccaaggg agacactggc      480

ccccgaggcc caaggggacc cgcaggcccc cctggccgag atggcatccc tggacagcct      540

ggacttcccg gaccccccgg accccccgga cctcccggac cccctggcct cggaggaaac      600

tttgctcccc agctgtctta tggctatgat gagaaatcaa ccggaggaat ttccgtgcct      660

ggccccatgg gtccctctgg tcctcgtggt ctccctggcc cccctggtgc acctggtccc      720

caaggcttcc aaggtccccc tggtgagcct ggcgagcctg gagcttcagg tcccatgggt      780

ccccgaggtc ccccaggtcc ccctggaaag aatggagatg atggggaagc tggaaaacct      840

ggtcgtcctg gtgagcgtgg gcctcctggg cctcagggtg ctcgaggatt gcccggaaca      900

gctggcctcc ctggaatgaa gggacacaga ggtttcagtg gtttggatgg tgccaaggga      960

gatgctggtc ctgctggtcc taagggtgag cctggcagcc ctggtgaaaa tggagctcct     1020

ggtcagatgg gcccccgtgg cctgcctggt gagagaggtc gccctggagc ccctggccct     1080

gctggtgctc gtggaaatga tggtgctact ggtgctgccg ggccccctgg tcccaccggc     1140

cccgctggtc ctcctggctt ccctggtgct gttggtgcta agggtgaagc tggtccccaa     1200

gggccccgag gctctgaagg tccccagggt gtgcgtggtg agcctggccc ccctggccct     1260

gctggtgctg ctggccctgc tggaaaccct ggtgctgatg gacagcctgg tgctaaaggt     1320

gccaatggtg ctcctggtat tgctggtgct cctggcttcc ctggtgcccg aggcccctct     1380

ggaccccagg gccccggcgg ccctcctggt cccaagggta acagcggtga acctggtgct     1440

cctggcagca aaggagacac tggtgctaag ggagagcctg gccctgttgg tgttcaagga     1500

ccccctggcc ctgctggaga ggaaggaaag cgaggagctc gaggtgaacc cggacccact     1560

ggcctgcccg gaccccctgg cgagcgtggt ggacctggta gccgtggttt ccctggcgca     1620

gatggtgttg ctggtcccaa gggtcccgct ggtgaacgtg gttctcctgg ccctgctggc     1680

cccaaaggat ctcctggtga agctggtcgt cccggtgaag ctggtctgcc tggtgccaag     1740

ggtctgactg gaagccctgg cagccctggt cctgatggca aaactggccc ccctggtccc     1800

gccggtcaag atggtcgccc cggaccccca ggcccacctg gtgcccgtgg tcaggctggt     1860

gtgatgggat tccctggacc taaaggtgct gctggagagc ccggcaaggc tggagagcga     1920

ggtgttcccg gaccccctgg cgctgtcggt cctgctggca aagatggaga ggctggagct     1980

cagggacccc ctggccctgc tggtcccgct ggcgagagag gtgaacaagg ccctgctggc     2040

tcccccggat tccagggtct ccctggtcct gctggtcctc caggtgaagc aggcaaacct     2100

ggtgaacagg gtgttcctgg agaccttggc gcccctggcc cctctggagc aagaggcgag     2160

agaggtttcc ctggcgagcg tggtgtgcaa ggtccccctg gtcctgctgg tccccgaggg     2220

gccaacggtg ctcccggcaa cgatggtgct aagggtgatg ctggtgcccc tggagctccc     2280

ggtagccagg gcgcccctgg ccttcaggga atgcctggtg aacgtggtgc agctggtctt     2340

ccagggccta agggtgacag aggtgatgct ggtcccaaag gtgctgatgg ctctcctggc     2400

aaagatggcg tccgtggtct gactggcccc attggtcctc ctggccctgc tggtgcccct     2460

ggtgacaagg gtgaaagtgg tcccagcggc cctgctggtc ccactggagc tcgtggtgcc     2520

cccggagacc gtggtgagcc tggtcccccc ggccctgctg gctttgctgg cccccctggt     2580

gctgacggcc aacctggtgc taaaggcgaa cctggtgatg ctggtgctaa aggcgatgct     2640

ggtccccctg gccctgccgg acccgctgga ccccctggcc ccattggtaa tgttggtgct     2700

cctggagcca aaggtgctcg cggcagcgct ggtccccctg gtgctactgg tttccctggt     2760

gctgctggcc gagtcggtcc tcctggcccc tctggaaatg ctggaccccc tggccctcct     2820

ggtcctgctg gcaaagaagg cggcaaaggt ccccgtggtg agactggccc tgctggacgt     2880

cctggtgaag ttggtccccc tggtccccct ggccctgctg gcgagaaagg atcccctggt     2940

gctgatggtc ctgctggtgc tcctggtact cccgggcctc aaggtattgc tggacagcgt     3000

ggtgtggtcg gcctgcctgg tcagagagga gagagaggct tccctggtct tcctggcccc     3060

tctggtgaac ctggcaaaca aggtccctct ggagcaagtg gtgaacgtgg tccccctggt     3120

cccatgggcc cccctggatt ggctggaccc cctggtgaat ctggacgtga gggggctcct     3180

ggtgccgaag gttcccctgg acgagacggt tctcctggcg ccaagggtga ccgtggtgag     3240

accggccccg ctggaccccc tggtgctcct ggtgctcctg gtgcccctgg ccccgttggc     3300

cctgctggca agagtggtga tcgtggtgag actggtcctg ctggtcccgc cggtcctgtc     3360

ggccctgttg gcgcccgtgg ccccgccgga ccccaaggcc cccgtggtga caagggtgag     3420

acaggcgaac agggcgacag aggcataaag ggtcaccgtg gcttctctgg cctccagggt     3480

ccccctggcc ctcctggctc tcctggtgaa caaggtccct ctggagcctc tggtcctgct     3540

ggtccccgag gtccccctgg ctctgctggt gctcctggca aagatggact caacggtctc     3600

cctggcccca ttgggccccc tggtcctcgc ggtcgcactg gtgatgctgg tcctgttggt     3660

ccccccggcc ctcctggacc tcctggtccc cctggtcctc ccagcgctgg tttcgacttc     3720

agcttcctgc cccagccacc tcaagagaag gctcacgatg gtggccgcta ctaccgggct     3780

gatgatgcca atgtggttcg tgaccgtgac ctcgaggtgg acaccaccct caagagcctg     3840

agccagcaga tcgagaacat ccggagccca gagggcagcc gcaagaaccc cgcccgcacc     3900

tgccgtgacc tcaagatgtg ccactctgac tggaagagtg gagagtactg gattgacccc     3960

aaccaaggct gcaacctgga tgccatcaaa gtcttctgca acatggagac tggtgagacc     4020

tgcgtgtacc ccactcagcc cagtgtggcc cagaagaact ggtacatcag caagaacccc     4080

aaggacaaga ggcatgtctg gttcggcgag agcatgaccg atggattcca gttcgagtat     4140

ggcggccagg gctccgaccc tgccgatgtg gccatccagc tgaccttcct gcgcctgatg     4200

tccaccgagg cctcccagaa catcacctac cactgcaaga acagcgtggc ctacatggac     4260

cagcagactg gcaacctcaa gaaggccctg ctcctccagg gctccaacga gatcgagatc     4320

cgcgccgagg gcaacagccg cttcacctac agcgtcactg tcgatggctg cacgagtcac     4380

accggagcct ggggcaagac agtgattgaa tacaaaacca ccaagacctc ccgcctgccc     4440

atcatcgatg tggccccctt ggacgttggt gccccagacc aggaattcgg cttcgacgtt     4500

ggccctgtct gcttcctgta aactccctcc atcccaacct ggctccctcc cacccaacca     4560

actttccccc caacccggaa acagacaagc aacccaaact gaaccccctc aaaagccaaa     4620

aaatgggaga caatttcaca tggactttgg aaaatatttt tttcctttgc attcatctct     4680

caaacttagt ttttatcttt gaccaaccga acatgaccaa aaaccaaaag tgcattcaac     4740

cttaccaaaa aaaaaaaaaa aaaaagaata aataaataac tttttaaaaa aggaagcttg     4800

gtccacttgc ttgaagaccc atgcgggggt aagtcccttt ctgcccgttg ggcttatgaa     4860

accccaatgc tgccctttct gctcctttct ccacaccccc cttggggcct cccctccact     4920

ccttcccaaa tctgtctccc cagaagacac aggaaacaat gtattgtctg cccagcaatc     4980

aaaggcaatg ctcaaacacc caagtggccc ccaccctcag cccgctcctg cccgcccagc     5040

acccccaggc cctgggggac ctggggttct cagactgcca aagaagcctt gccatctggc     5100

gctcccatgg ctcttgcaac atctcccctt cgtttttgag ggggtcatgc cgggggagcc     5160

accagcccct cactgggttc ggaggagagt caggaagggc cacgacaaag cagaaacatc     5220

ggatttgggg aacgcgtgtc aatcccttgt gccgcagggc tgggcgggag agactgttct     5280

gttccttgtg taactgtgtt gctgaaagac tacctcgttc ttgtcttgat gtgtcaccgg     5340

ggcaactgcc tgggggcggg gatgggggca gggtggaagc ggctccccat tttataccaa     5400

aggtgctaca tctatgtgat gggtggggtg gggagggaat cactggtgct atagaaattg     5460

agatgccccc ccaggccagc aaatgttcct ttttgttcaa agtctatttt tattccttga     5520

tatttttctt tttttttttt tttttttgtg gatggggact tgtgaatttt tctaaaggtg     5580

ctatttaaca tgggaggaga gcgtgtgcgg ctccagccca gcccgctgct cactttccac     5640

cctctctcca cctgcctctg gcttctcagg cctctgctct ccgacctctc tcctctgaaa     5700

ccctcctcca cagctgcagc ccatcctccc ggctccctcc tagtctgtcc tgcgtcctct     5760

gtccccgggt ttcagagaca acttcccaaa gcacaaagca gtttttcccc ctaggggtgg     5820

gaggaagcaa aagactctgt acctattttg tatgtgtata ataatttgag atgtttttaa     5880

ttattttgat tgctggaata aagcatgtgg aaatgaccca aacataa                   5927


<210> 52
<211> 1464
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..1464
<223> /mol_type="protein"
      /note="Homo sapiens Col1A1"
      /organism="Homo sapiens"

<400> 52
Met Phe Ser Phe Val Asp Leu Arg Leu Leu Leu Leu Leu Ala Ala Thr 
1               5                   10                   15    
Ala Leu Leu Thr His Gly Gln Glu Glu Gly Gln Val Glu Gly Gln Asp 
            20                   25                  30        
Glu Asp Ile Pro Pro Ile Thr Cys Val Gln Asn Gly Leu Arg Tyr His 
        35                   40                  45            
Asp Arg Asp Val Trp Lys Pro Glu Pro Cys Arg Ile Cys Val Cys Asp 
    50                   55                  60                
Asn Gly Lys Val Leu Cys Asp Asp Val Ile Cys Asp Glu Thr Lys Asn 
65                   70                  75                  80
Cys Pro Gly Ala Glu Val Pro Glu Gly Glu Cys Cys Pro Val Cys Pro 
                85                   90                  95    
Asp Gly Ser Glu Ser Pro Thr Asp Gln Glu Thr Thr Gly Val Glu Gly 
            100                  105                110        
Pro Lys Gly Asp Thr Gly Pro Arg Gly Pro Arg Gly Pro Ala Gly Pro 
        115                  120                125            
Pro Gly Arg Asp Gly Ile Pro Gly Gln Pro Gly Leu Pro Gly Pro Pro 
    130                  135                140                
Gly Pro Pro Gly Pro Pro Gly Pro Pro Gly Leu Gly Gly Asn Phe Ala 
145                  150                155                  160
Pro Gln Leu Ser Tyr Gly Tyr Asp Glu Lys Ser Thr Gly Gly Ile Ser 
                165                  170                175    
Val Pro Gly Pro Met Gly Pro Ser Gly Pro Arg Gly Leu Pro Gly Pro 
            180                  185                190        
Pro Gly Ala Pro Gly Pro Gln Gly Phe Gln Gly Pro Pro Gly Glu Pro 
        195                  200                205            
Gly Glu Pro Gly Ala Ser Gly Pro Met Gly Pro Arg Gly Pro Pro Gly 
    210                  215                220                
Pro Pro Gly Lys Asn Gly Asp Asp Gly Glu Ala Gly Lys Pro Gly Arg 
225                  230                235                  240
Pro Gly Glu Arg Gly Pro Pro Gly Pro Gln Gly Ala Arg Gly Leu Pro 
                245                  250                255    
Gly Thr Ala Gly Leu Pro Gly Met Lys Gly His Arg Gly Phe Ser Gly 
            260                  265                270        
Leu Asp Gly Ala Lys Gly Asp Ala Gly Pro Ala Gly Pro Lys Gly Glu 
        275                  280                285            
Pro Gly Ser Pro Gly Glu Asn Gly Ala Pro Gly Gln Met Gly Pro Arg 
    290                  295                300                
Gly Leu Pro Gly Glu Arg Gly Arg Pro Gly Ala Pro Gly Pro Ala Gly 
305                  310                315                  320
Ala Arg Gly Asn Asp Gly Ala Thr Gly Ala Ala Gly Pro Pro Gly Pro 
                325                  330                335    
Thr Gly Pro Ala Gly Pro Pro Gly Phe Pro Gly Ala Val Gly Ala Lys 
            340                  345                350        
Gly Glu Ala Gly Pro Gln Gly Pro Arg Gly Ser Glu Gly Pro Gln Gly 
        355                  360                365            
Val Arg Gly Glu Pro Gly Pro Pro Gly Pro Ala Gly Ala Ala Gly Pro 
    370                  375                380                
Ala Gly Asn Pro Gly Ala Asp Gly Gln Pro Gly Ala Lys Gly Ala Asn 
385                  390                395                  400
Gly Ala Pro Gly Ile Ala Gly Ala Pro Gly Phe Pro Gly Ala Arg Gly 
                405                  410                415    
Pro Ser Gly Pro Gln Gly Pro Gly Gly Pro Pro Gly Pro Lys Gly Asn 
            420                  425                430        
Ser Gly Glu Pro Gly Ala Pro Gly Ser Lys Gly Asp Thr Gly Ala Lys 
        435                  440                445            
Gly Glu Pro Gly Pro Val Gly Val Gln Gly Pro Pro Gly Pro Ala Gly 
    450                  455                460                
Glu Glu Gly Lys Arg Gly Ala Arg Gly Glu Pro Gly Pro Thr Gly Leu 
465                  470                475                  480
Pro Gly Pro Pro Gly Glu Arg Gly Gly Pro Gly Ser Arg Gly Phe Pro 
                485                  490                495    
Gly Ala Asp Gly Val Ala Gly Pro Lys Gly Pro Ala Gly Glu Arg Gly 
            500                  505                510        
Ser Pro Gly Pro Ala Gly Pro Lys Gly Ser Pro Gly Glu Ala Gly Arg 
        515                  520                525            
Pro Gly Glu Ala Gly Leu Pro Gly Ala Lys Gly Leu Thr Gly Ser Pro 
    530                  535                540                
Gly Ser Pro Gly Pro Asp Gly Lys Thr Gly Pro Pro Gly Pro Ala Gly 
545                  550                555                  560
Gln Asp Gly Arg Pro Gly Pro Pro Gly Pro Pro Gly Ala Arg Gly Gln 
                565                  570                575    
Ala Gly Val Met Gly Phe Pro Gly Pro Lys Gly Ala Ala Gly Glu Pro 
            580                  585                590        
Gly Lys Ala Gly Glu Arg Gly Val Pro Gly Pro Pro Gly Ala Val Gly 
        595                  600                605            
Pro Ala Gly Lys Asp Gly Glu Ala Gly Ala Gln Gly Pro Pro Gly Pro 
    610                  615                620                
Ala Gly Pro Ala Gly Glu Arg Gly Glu Gln Gly Pro Ala Gly Ser Pro 
625                  630                635                  640
Gly Phe Gln Gly Leu Pro Gly Pro Ala Gly Pro Pro Gly Glu Ala Gly 
                645                  650                655    
Lys Pro Gly Glu Gln Gly Val Pro Gly Asp Leu Gly Ala Pro Gly Pro 
            660                  665                670        
Ser Gly Ala Arg Gly Glu Arg Gly Phe Pro Gly Glu Arg Gly Val Gln 
        675                  680                685            
Gly Pro Pro Gly Pro Ala Gly Pro Arg Gly Ala Asn Gly Ala Pro Gly 
    690                  695                700                
Asn Asp Gly Ala Lys Gly Asp Ala Gly Ala Pro Gly Ala Pro Gly Ser 
705                  710                715                  720
Gln Gly Ala Pro Gly Leu Gln Gly Met Pro Gly Glu Arg Gly Ala Ala 
                725                  730                735    
Gly Leu Pro Gly Pro Lys Gly Asp Arg Gly Asp Ala Gly Pro Lys Gly 
            740                  745                750        
Ala Asp Gly Ser Pro Gly Lys Asp Gly Val Arg Gly Leu Thr Gly Pro 
        755                  760                765            
Ile Gly Pro Pro Gly Pro Ala Gly Ala Pro Gly Asp Lys Gly Glu Ser 
    770                  775                780                
Gly Pro Ser Gly Pro Ala Gly Pro Thr Gly Ala Arg Gly Ala Pro Gly 
785                  790                795                  800
Asp Arg Gly Glu Pro Gly Pro Pro Gly Pro Ala Gly Phe Ala Gly Pro 
                805                  810                815    
Pro Gly Ala Asp Gly Gln Pro Gly Ala Lys Gly Glu Pro Gly Asp Ala 
            820                  825                830        
Gly Ala Lys Gly Asp Ala Gly Pro Pro Gly Pro Ala Gly Pro Ala Gly 
        835                  840                845            
Pro Pro Gly Pro Ile Gly Asn Val Gly Ala Pro Gly Ala Lys Gly Ala 
    850                  855                860                
Arg Gly Ser Ala Gly Pro Pro Gly Ala Thr Gly Phe Pro Gly Ala Ala 
865                  870                875                  880
Gly Arg Val Gly Pro Pro Gly Pro Ser Gly Asn Ala Gly Pro Pro Gly 
                885                  890                895    
Pro Pro Gly Pro Ala Gly Lys Glu Gly Gly Lys Gly Pro Arg Gly Glu 
            900                  905                910        
Thr Gly Pro Ala Gly Arg Pro Gly Glu Val Gly Pro Pro Gly Pro Pro 
        915                  920                925            
Gly Pro Ala Gly Glu Lys Gly Ser Pro Gly Ala Asp Gly Pro Ala Gly 
    930                  935                940                
Ala Pro Gly Thr Pro Gly Pro Gln Gly Ile Ala Gly Gln Arg Gly Val 
945                  950                955                  960
Val Gly Leu Pro Gly Gln Arg Gly Glu Arg Gly Phe Pro Gly Leu Pro 
                965                  970                975    
Gly Pro Ser Gly Glu Pro Gly Lys Gln Gly Pro Ser Gly Ala Ser Gly 
            980                  985                990        
Glu Arg Gly Pro Pro Gly Pro Met Gly Pro Pro Gly Leu Ala Gly Pro 
        995                  1000                1005            
Pro Gly Glu Ser Gly Arg Glu Gly Ala Pro Gly Ala Glu Gly Ser Pro 
    1010                1015                1020                
Gly Arg Asp Gly Ser Pro Gly Ala Lys Gly Asp Arg Gly Glu Thr Gly 
1025                1030                1035                1040
Pro Ala Gly Pro Pro Gly Ala Pro Gly Ala Pro Gly Ala Pro Gly Pro 
                1045                1050                1055    
Val Gly Pro Ala Gly Lys Ser Gly Asp Arg Gly Glu Thr Gly Pro Ala 
            1060                1065                1070        
Gly Pro Ala Gly Pro Val Gly Pro Val Gly Ala Arg Gly Pro Ala Gly 
        1075                1080                1085            
Pro Gln Gly Pro Arg Gly Asp Lys Gly Glu Thr Gly Glu Gln Gly Asp 
    1090                1095                1100                
Arg Gly Ile Lys Gly His Arg Gly Phe Ser Gly Leu Gln Gly Pro Pro 
1105                1110                1115                1120
Gly Pro Pro Gly Ser Pro Gly Glu Gln Gly Pro Ser Gly Ala Ser Gly 
                1125                1130                1135    
Pro Ala Gly Pro Arg Gly Pro Pro Gly Ser Ala Gly Ala Pro Gly Lys 
            1140                1145                1150        
Asp Gly Leu Asn Gly Leu Pro Gly Pro Ile Gly Pro Pro Gly Pro Arg 
        1155                1160                1165            
Gly Arg Thr Gly Asp Ala Gly Pro Val Gly Pro Pro Gly Pro Pro Gly 
    1170                1175                1180                
Pro Pro Gly Pro Pro Gly Pro Pro Ser Ala Gly Phe Asp Phe Ser Phe 
1185                1190                1195                1200
Leu Pro Gln Pro Pro Gln Glu Lys Ala His Asp Gly Gly Arg Tyr Tyr 
                1205                1210                1215    
Arg Ala Asp Asp Ala Asn Val Val Arg Asp Arg Asp Leu Glu Val Asp 
            1220                1225                1230        
Thr Thr Leu Lys Ser Leu Ser Gln Gln Ile Glu Asn Ile Arg Ser Pro 
        1235                1240                1245            
Glu Gly Ser Arg Lys Asn Pro Ala Arg Thr Cys Arg Asp Leu Lys Met 
    1250                1255                1260                
Cys His Ser Asp Trp Lys Ser Gly Glu Tyr Trp Ile Asp Pro Asn Gln 
1265                1270                1275                1280
Gly Cys Asn Leu Asp Ala Ile Lys Val Phe Cys Asn Met Glu Thr Gly 
                1285                1290                1295    
Glu Thr Cys Val Tyr Pro Thr Gln Pro Ser Val Ala Gln Lys Asn Trp 
            1300                1305                1310        
Tyr Ile Ser Lys Asn Pro Lys Asp Lys Arg His Val Trp Phe Gly Glu 
        1315                1320                1325            
Ser Met Thr Asp Gly Phe Gln Phe Glu Tyr Gly Gly Gln Gly Ser Asp 
    1330                1335                1340                
Pro Ala Asp Val Ala Ile Gln Leu Thr Phe Leu Arg Leu Met Ser Thr 
1345                1350                1355                1360
Glu Ala Ser Gln Asn Ile Thr Tyr His Cys Lys Asn Ser Val Ala Tyr 
                1365                1370                1375    
Met Asp Gln Gln Thr Gly Asn Leu Lys Lys Ala Leu Leu Leu Gln Gly 
            1380                1385                1390        
Ser Asn Glu Ile Glu Ile Arg Ala Glu Gly Asn Ser Arg Phe Thr Tyr 
        1395                1400                1405            
Ser Val Thr Val Asp Gly Cys Thr Ser His Thr Gly Ala Trp Gly Lys 
    1410                1415                1420                
Thr Val Ile Glu Tyr Lys Thr Thr Lys Thr Ser Arg Leu Pro Ile Ile 
1425                1430                1435                1440
Asp Val Ala Pro Leu Asp Val Gly Ala Pro Asp Gln Glu Phe Gly Phe 
                1445                1450                1455    
Asp Val Gly Pro Val Cys Phe Leu 
            1460                

<210> 53
<211> 5490
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..5490
<223> /mol_type="DNA"
      /note="Homo sapiens Col3A1"
      /organism="Homo sapiens"

<400> 53
ggctgagttt tatgacgggc ccggtgctga agggcaggga acaacttgat ggtgctactt       60

tgaactgctt ttcttttctc ctttttgcac aaagagtctc atgtctgata tttagacatg      120

atgagctttg tgcaaaaggg gagctggcta cttctcgctc tgcttcatcc cactattatt      180

ttggcacaac aggaagctgt tgaaggagga tgttcccatc ttggtcagtc ctatgcggat      240

agagatgtct ggaagccaga accatgccaa atatgtgtct gtgactcagg atccgttctc      300

tgcgatgaca taatatgtga cgatcaagaa ttagactgcc ccaacccaga aattccattt      360

ggagaatgtt gtgcagtttg cccacagcct ccaactgctc ctactcgccc tcctaatggt      420

caaggacctc aaggccccaa gggagatcca ggccctcctg gtattcctgg gagaaatggt      480

gaccctggta ttccaggaca accagggtcc cctggttctc ctggcccccc tggaatctgt      540

gaatcatgcc ctactggtcc tcagaactat tctccccagt atgattcata tgatgtcaag      600

tctggagtag cagtaggagg actcgcaggc tatcctggac cagctggccc cccaggccct      660

cccggtcccc ctggtacatc tggtcatcct ggttcccctg gatctccagg ataccaagga      720

ccccctggtg aacctgggca agctggtcct tcaggccctc caggacctcc tggtgctata      780

ggtccatctg gtcctgctgg aaaagatgga gaatcaggta gacccggacg acctggagag      840

cgaggattgc ctggacctcc aggtatcaaa ggtccagctg ggatacctgg attccctggt      900

atgaaaggac acagaggctt cgatggacga aatggagaaa agggtgaaac aggtgctcct      960

ggattaaagg gtgaaaatgg tcttccaggc gaaaatggag ctcctggacc catgggtcca     1020

agaggggctc ctggtgagcg aggacggcca ggacttcctg gggctgcagg tgctcggggt     1080

aatgacggtg ctcgaggcag tgatggtcaa ccaggccctc ctggtcctcc tggaactgcc     1140

ggattccctg gatcccctgg tgctaagggt gaagttggac ctgcagggtc tcctggttca     1200

aatggtgccc ctggacaaag aggagaacct ggacctcagg gacacgctgg tgctcaaggt     1260

cctcctggcc ctcctgggat taatggtagt cctggtggta aaggcgaaat gggtcccgct     1320

ggcattcctg gagctcctgg actgatggga gcccggggtc ctccaggacc agccggtgct     1380

aatggtgctc ctggactgcg aggtggtgca ggtgagcctg gtaagaatgg tgccaaagga     1440

gagcccggac cacgtggtga acgcggtgag gctggtattc caggtgttcc aggagctaaa     1500

ggcgaagatg gcaaggatgg atcacctgga gaacctggtg caaatgggct tccaggagct     1560

gcaggagaaa ggggtgcccc tgggttccga ggacctgctg gaccaaatgg catcccagga     1620

gaaaagggtc ctgctggaga gcgtggtgct ccaggccctg cagggcccag aggagctgct     1680

ggagaacctg gcagagatgg cgtccctgga ggtccaggaa tgaggggcat gcccggaagt     1740

ccaggaggac caggaagtga tgggaaacca gggcctcccg gaagtcaagg agaaagtggt     1800

cgaccaggtc ctcctgggcc atctggtccc cgaggtcagc ctggtgtcat gggcttcccc     1860

ggtcctaaag gaaatgatgg tgctcctggt aagaatggag aacgaggtgg ccctggagga     1920

cctggccctc agggtcctcc tggaaagaat ggtgaaactg gacctcaggg acccccaggg     1980

cctactgggc ctggtggtga caaaggagac acaggacccc ctggtccaca aggattacaa     2040

ggcttgcctg gtacaggtgg tcctccagga gaaaatggaa aacctgggga accaggtcca     2100

aagggtgatg ccggtgcacc tggagctcca ggaggcaagg gtgatgctgg tgcccctggt     2160

gaacgtggac ctcctggatt ggcaggggcc ccaggactta gaggtggagc tggtccccct     2220

ggtcccgaag gaggaaaggg tgctgctggt cctcctgggc cacctggtgc tgctggtact     2280

cctggtctgc aaggaatgcc tggagaaaga ggaggtcttg gaagtcctgg tccaaagggt     2340

gacaagggtg aaccaggcgg tccaggtgct gatggtgtcc cagggaaaga tggcccaagg     2400

ggtcctactg gtcctattgg tcctcctggc ccagctggcc agcctggaga taagggtgaa     2460

ggtggtgccc ccggacttcc aggtatagct ggacctcgtg gtagccctgg tgagagaggt     2520

gaaactggcc ctccaggacc tgctggtttc cctggtgctc ctggacagaa tggtgaacct     2580

ggtggtaaag gagaaagagg ggctccgggt gagaaaggtg aaggaggccc tcctggagtt     2640

gcaggacccc ctggaggttc tggacctgct ggtcctcctg gtccccaagg tgtcaaaggt     2700

gaacgtggca gtcctggtgg acctggtgct gctggcttcc ctggtgctcg tggtcttcct     2760

ggtcctcctg gtagtaatgg taacccagga cccccaggtc ccagcggttc tccaggcaag     2820

gatgggcccc caggtcctgc gggtaacact ggtgctcctg gcagccctgg agtgtctgga     2880

ccaaaaggtg atgctggcca accaggagag aagggatcgc ctggtgccca gggcccacca     2940

ggagctccag gcccacttgg gattgctggg atcactggag cacggggtct tgcaggacca     3000

ccaggcatgc caggtcctag gggaagccct ggccctcagg gtgtcaaggg tgaaagtggg     3060

aaaccaggag ctaacggtct cagtggagaa cgtggtcccc ctggacccca gggtcttcct     3120

ggtctggctg gtacagctgg tgaacctgga agagatggaa accctggatc agatggtctt     3180

ccaggccgag atggatctcc tggtggcaag ggtgatcgtg gtgaaaatgg ctctcctggt     3240

gcccctggcg ctcctggtca tccaggccca cctggtcctg tcggtccagc tggaaagagt     3300

ggtgacagag gagaaagtgg ccctgctggc cctgctggtg ctcccggtcc tgctggttcc     3360

cgaggtgctc ctggtcctca aggcccacgt ggtgacaaag gtgaaacagg tgaacgtgga     3420

gctgctggca tcaaaggaca tcgaggattc cctggtaatc caggtgcccc aggttctcca     3480

ggccctgctg gtcagcaggg tgcaatcggc agtccaggac ctgcaggccc cagaggacct     3540

gttggaccca gtggacctcc tggcaaagat ggaaccagtg gacatccagg tcccattgga     3600

ccaccagggc ctcgaggtaa cagaggtgaa agaggatctg agggctcccc aggccaccca     3660

gggcaaccag gccctcctgg acctcctggt gcccctggtc cttgctgtgg tggtgttgga     3720

gccgctgcca ttgctgggat tggaggtgaa aaagctggcg gttttgcccc gtattatgga     3780

gatgaaccaa tggatttcaa aatcaacacc gatgagatta tgacttcact caagtctgtt     3840

aatggacaaa tagaaagcct cattagtcct gatggttctc gtaaaaaccc cgctagaaac     3900

tgcagagacc tgaaattctg ccatcctgaa ctcaagagtg gagaatactg ggttgaccct     3960

aaccaaggat gcaaattgga tgctatcaag gtattctgta atatggaaac tggggaaaca     4020

tgcataagtg ccaatccttt gaatgttcca cggaaacact ggtggacaga ttctagtgct     4080

gagaagaaac acgtttggtt tggagagtcc atggatggtg gttttcagtt tagctacggc     4140

aatcctgaac ttcctgaaga tgtccttgat gtgcagctgg cattccttcg acttctctcc     4200

agccgagctt cccagaacat cacatatcac tgcaaaaata gcattgcata catggatcag     4260

gccagtggaa atgtaaagaa ggccctgaag ctgatggggt caaatgaagg tgaattcaag     4320

gctgaaggaa atagcaaatt cacctacaca gttctggagg atggttgcac gaaacacact     4380

ggggaatgga gcaaaacagt ctttgaatat cgaacacgca aggctgtgag actacctatt     4440

gtagatattg caccctatga cattggtggt cctgatcaag aatttggtgt ggacgttggc     4500

cctgtttgct ttttataaac caaactctat ctgaaatccc aacaaaaaaa atttaactcc     4560

atatgtgttc ctcttgttct aatcttgtca accagtgcaa gtgaccgaca aaattccagt     4620

tatttatttc caaaatgttt ggaaacagta taatttgaca aagaaaaatg atacttctct     4680

ttttttgctg ttccaccaaa tacaattcaa atgctttttg ttttattttt ttaccaattc     4740

caatttcaaa atgtctcaat ggtgctataa taaataaact tcaacactct ttatgataac     4800

aacactgtgt tatattcttt gaatcctagc ccatctgcag agcaatgact gtgctcacca     4860

gtaaaagata acctttcttt ctgaaatagt caaatacgaa attagaaaag ccctccctat     4920

tttaactacc tcaactggtc agaaacacag attgtattct atgagtccca gaagatgaaa     4980

aaaattttat acgttgataa aacttataaa tttcattgat taatctcctg gaagattggt     5040

ttaaaaagaa aagtgtaatg caagaattta aagaaatatt tttaaagcca caattatttt     5100

aatattggat atcaactgct tgtaaaggtg ctcctctttt ttcttgtcat tgctggtcaa     5160

gattactaat atttgggaag gctttaaaga cgcatgttat ggtgctaatg tactttcact     5220

tttaaactct agatcagaat tgttgacttg cattcagaac ataaatgcac aaaatctgta     5280

catgtctccc atcagaaaga ttcattggca tgccacaggg gattctcctc cttcatcctg     5340

taaaggtcaa caataaaaac caaattatgg ggctgctttt gtcacactag catagagaat     5400

gtgttgaaat ttaactttgt aagcttgtat gtggttgttg atcttttttt tccttacaga     5460

cacccataat aaaatatcat attaaaattc                                      5490


<210> 54
<211> 1466
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..1466
<223> /mol_type="protein"
      /note="Homo sapiens Col3A1"
      /organism="Homo sapiens"

<400> 54
Met Met Ser Phe Val Gln Lys Gly Ser Trp Leu Leu Leu Ala Leu Leu 
1               5                   10                   15    
His Pro Thr Ile Ile Leu Ala Gln Gln Glu Ala Val Glu Gly Gly Cys 
            20                   25                  30        
Ser His Leu Gly Gln Ser Tyr Ala Asp Arg Asp Val Trp Lys Pro Glu 
        35                   40                  45            
Pro Cys Gln Ile Cys Val Cys Asp Ser Gly Ser Val Leu Cys Asp Asp 
    50                   55                  60                
Ile Ile Cys Asp Asp Gln Glu Leu Asp Cys Pro Asn Pro Glu Ile Pro 
65                   70                  75                  80
Phe Gly Glu Cys Cys Ala Val Cys Pro Gln Pro Pro Thr Ala Pro Thr 
                85                   90                  95    
Arg Pro Pro Asn Gly Gln Gly Pro Gln Gly Pro Lys Gly Asp Pro Gly 
            100                  105                110        
Pro Pro Gly Ile Pro Gly Arg Asn Gly Asp Pro Gly Ile Pro Gly Gln 
        115                  120                125            
Pro Gly Ser Pro Gly Ser Pro Gly Pro Pro Gly Ile Cys Glu Ser Cys 
    130                  135                140                
Pro Thr Gly Pro Gln Asn Tyr Ser Pro Gln Tyr Asp Ser Tyr Asp Val 
145                  150                155                  160
Lys Ser Gly Val Ala Val Gly Gly Leu Ala Gly Tyr Pro Gly Pro Ala 
                165                  170                175    
Gly Pro Pro Gly Pro Pro Gly Pro Pro Gly Thr Ser Gly His Pro Gly 
            180                  185                190        
Ser Pro Gly Ser Pro Gly Tyr Gln Gly Pro Pro Gly Glu Pro Gly Gln 
        195                  200                205            
Ala Gly Pro Ser Gly Pro Pro Gly Pro Pro Gly Ala Ile Gly Pro Ser 
    210                  215                220                
Gly Pro Ala Gly Lys Asp Gly Glu Ser Gly Arg Pro Gly Arg Pro Gly 
225                  230                235                  240
Glu Arg Gly Leu Pro Gly Pro Pro Gly Ile Lys Gly Pro Ala Gly Ile 
                245                  250                255    
Pro Gly Phe Pro Gly Met Lys Gly His Arg Gly Phe Asp Gly Arg Asn 
            260                  265                270        
Gly Glu Lys Gly Glu Thr Gly Ala Pro Gly Leu Lys Gly Glu Asn Gly 
        275                  280                285            
Leu Pro Gly Glu Asn Gly Ala Pro Gly Pro Met Gly Pro Arg Gly Ala 
    290                  295                300                
Pro Gly Glu Arg Gly Arg Pro Gly Leu Pro Gly Ala Ala Gly Ala Arg 
305                  310                315                  320
Gly Asn Asp Gly Ala Arg Gly Ser Asp Gly Gln Pro Gly Pro Pro Gly 
                325                  330                335    
Pro Pro Gly Thr Ala Gly Phe Pro Gly Ser Pro Gly Ala Lys Gly Glu 
            340                  345                350        
Val Gly Pro Ala Gly Ser Pro Gly Ser Asn Gly Ala Pro Gly Gln Arg 
        355                  360                365            
Gly Glu Pro Gly Pro Gln Gly His Ala Gly Ala Gln Gly Pro Pro Gly 
    370                  375                380                
Pro Pro Gly Ile Asn Gly Ser Pro Gly Gly Lys Gly Glu Met Gly Pro 
385                  390                395                  400
Ala Gly Ile Pro Gly Ala Pro Gly Leu Met Gly Ala Arg Gly Pro Pro 
                405                  410                415    
Gly Pro Ala Gly Ala Asn Gly Ala Pro Gly Leu Arg Gly Gly Ala Gly 
            420                  425                430        
Glu Pro Gly Lys Asn Gly Ala Lys Gly Glu Pro Gly Pro Arg Gly Glu 
        435                  440                445            
Arg Gly Glu Ala Gly Ile Pro Gly Val Pro Gly Ala Lys Gly Glu Asp 
    450                  455                460                
Gly Lys Asp Gly Ser Pro Gly Glu Pro Gly Ala Asn Gly Leu Pro Gly 
465                  470                475                  480
Ala Ala Gly Glu Arg Gly Ala Pro Gly Phe Arg Gly Pro Ala Gly Pro 
                485                  490                495    
Asn Gly Ile Pro Gly Glu Lys Gly Pro Ala Gly Glu Arg Gly Ala Pro 
            500                  505                510        
Gly Pro Ala Gly Pro Arg Gly Ala Ala Gly Glu Pro Gly Arg Asp Gly 
        515                  520                525            
Val Pro Gly Gly Pro Gly Met Arg Gly Met Pro Gly Ser Pro Gly Gly 
    530                  535                540                
Pro Gly Ser Asp Gly Lys Pro Gly Pro Pro Gly Ser Gln Gly Glu Ser 
545                  550                555                  560
Gly Arg Pro Gly Pro Pro Gly Pro Ser Gly Pro Arg Gly Gln Pro Gly 
                565                  570                575    
Val Met Gly Phe Pro Gly Pro Lys Gly Asn Asp Gly Ala Pro Gly Lys 
            580                  585                590        
Asn Gly Glu Arg Gly Gly Pro Gly Gly Pro Gly Pro Gln Gly Pro Pro 
        595                  600                605            
Gly Lys Asn Gly Glu Thr Gly Pro Gln Gly Pro Pro Gly Pro Thr Gly 
    610                  615                620                
Pro Gly Gly Asp Lys Gly Asp Thr Gly Pro Pro Gly Pro Gln Gly Leu 
625                  630                635                  640
Gln Gly Leu Pro Gly Thr Gly Gly Pro Pro Gly Glu Asn Gly Lys Pro 
                645                  650                655    
Gly Glu Pro Gly Pro Lys Gly Asp Ala Gly Ala Pro Gly Ala Pro Gly 
            660                  665                670        
Gly Lys Gly Asp Ala Gly Ala Pro Gly Glu Arg Gly Pro Pro Gly Leu 
        675                  680                685            
Ala Gly Ala Pro Gly Leu Arg Gly Gly Ala Gly Pro Pro Gly Pro Glu 
    690                  695                700                
Gly Gly Lys Gly Ala Ala Gly Pro Pro Gly Pro Pro Gly Ala Ala Gly 
705                  710                715                  720
Thr Pro Gly Leu Gln Gly Met Pro Gly Glu Arg Gly Gly Leu Gly Ser 
                725                  730                735    
Pro Gly Pro Lys Gly Asp Lys Gly Glu Pro Gly Gly Pro Gly Ala Asp 
            740                  745                750        
Gly Val Pro Gly Lys Asp Gly Pro Arg Gly Pro Thr Gly Pro Ile Gly 
        755                  760                765            
Pro Pro Gly Pro Ala Gly Gln Pro Gly Asp Lys Gly Glu Gly Gly Ala 
    770                  775                780                
Pro Gly Leu Pro Gly Ile Ala Gly Pro Arg Gly Ser Pro Gly Glu Arg 
785                  790                795                  800
Gly Glu Thr Gly Pro Pro Gly Pro Ala Gly Phe Pro Gly Ala Pro Gly 
                805                  810                815    
Gln Asn Gly Glu Pro Gly Gly Lys Gly Glu Arg Gly Ala Pro Gly Glu 
            820                  825                830        
Lys Gly Glu Gly Gly Pro Pro Gly Val Ala Gly Pro Pro Gly Gly Ser 
        835                  840                845            
Gly Pro Ala Gly Pro Pro Gly Pro Gln Gly Val Lys Gly Glu Arg Gly 
    850                  855                860                
Ser Pro Gly Gly Pro Gly Ala Ala Gly Phe Pro Gly Ala Arg Gly Leu 
865                  870                875                  880
Pro Gly Pro Pro Gly Ser Asn Gly Asn Pro Gly Pro Pro Gly Pro Ser 
                885                  890                895    
Gly Ser Pro Gly Lys Asp Gly Pro Pro Gly Pro Ala Gly Asn Thr Gly 
            900                  905                910        
Ala Pro Gly Ser Pro Gly Val Ser Gly Pro Lys Gly Asp Ala Gly Gln 
        915                  920                925            
Pro Gly Glu Lys Gly Ser Pro Gly Ala Gln Gly Pro Pro Gly Ala Pro 
    930                  935                940                
Gly Pro Leu Gly Ile Ala Gly Ile Thr Gly Ala Arg Gly Leu Ala Gly 
945                  950                955                  960
Pro Pro Gly Met Pro Gly Pro Arg Gly Ser Pro Gly Pro Gln Gly Val 
                965                  970                975    
Lys Gly Glu Ser Gly Lys Pro Gly Ala Asn Gly Leu Ser Gly Glu Arg 
            980                  985                990        
Gly Pro Pro Gly Pro Gln Gly Leu Pro Gly Leu Ala Gly Thr Ala Gly 
        995                  1000                1005            
Glu Pro Gly Arg Asp Gly Asn Pro Gly Ser Asp Gly Leu Pro Gly Arg 
    1010                1015                1020                
Asp Gly Ser Pro Gly Gly Lys Gly Asp Arg Gly Glu Asn Gly Ser Pro 
1025                1030                1035                1040
Gly Ala Pro Gly Ala Pro Gly His Pro Gly Pro Pro Gly Pro Val Gly 
                1045                1050                1055    
Pro Ala Gly Lys Ser Gly Asp Arg Gly Glu Ser Gly Pro Ala Gly Pro 
            1060                1065                1070        
Ala Gly Ala Pro Gly Pro Ala Gly Ser Arg Gly Ala Pro Gly Pro Gln 
        1075                1080                1085            
Gly Pro Arg Gly Asp Lys Gly Glu Thr Gly Glu Arg Gly Ala Ala Gly 
    1090                1095                1100                
Ile Lys Gly His Arg Gly Phe Pro Gly Asn Pro Gly Ala Pro Gly Ser 
1105                1110                1115                1120
Pro Gly Pro Ala Gly Gln Gln Gly Ala Ile Gly Ser Pro Gly Pro Ala 
                1125                1130                1135    
Gly Pro Arg Gly Pro Val Gly Pro Ser Gly Pro Pro Gly Lys Asp Gly 
            1140                1145                1150        
Thr Ser Gly His Pro Gly Pro Ile Gly Pro Pro Gly Pro Arg Gly Asn 
        1155                1160                1165            
Arg Gly Glu Arg Gly Ser Glu Gly Ser Pro Gly His Pro Gly Gln Pro 
    1170                1175                1180                
Gly Pro Pro Gly Pro Pro Gly Ala Pro Gly Pro Cys Cys Gly Gly Val 
1185                1190                1195                1200
Gly Ala Ala Ala Ile Ala Gly Ile Gly Gly Glu Lys Ala Gly Gly Phe 
                1205                1210                1215    
Ala Pro Tyr Tyr Gly Asp Glu Pro Met Asp Phe Lys Ile Asn Thr Asp 
            1220                1225                1230        
Glu Ile Met Thr Ser Leu Lys Ser Val Asn Gly Gln Ile Glu Ser Leu 
        1235                1240                1245            
Ile Ser Pro Asp Gly Ser Arg Lys Asn Pro Ala Arg Asn Cys Arg Asp 
    1250                1255                1260                
Leu Lys Phe Cys His Pro Glu Leu Lys Ser Gly Glu Tyr Trp Val Asp 
1265                1270                1275                1280
Pro Asn Gln Gly Cys Lys Leu Asp Ala Ile Lys Val Phe Cys Asn Met 
                1285                1290                1295    
Glu Thr Gly Glu Thr Cys Ile Ser Ala Asn Pro Leu Asn Val Pro Arg 
            1300                1305                1310        
Lys His Trp Trp Thr Asp Ser Ser Ala Glu Lys Lys His Val Trp Phe 
        1315                1320                1325            
Gly Glu Ser Met Asp Gly Gly Phe Gln Phe Ser Tyr Gly Asn Pro Glu 
    1330                1335                1340                
Leu Pro Glu Asp Val Leu Asp Val Gln Leu Ala Phe Leu Arg Leu Leu 
1345                1350                1355                1360
Ser Ser Arg Ala Ser Gln Asn Ile Thr Tyr His Cys Lys Asn Ser Ile 
                1365                1370                1375    
Ala Tyr Met Asp Gln Ala Ser Gly Asn Val Lys Lys Ala Leu Lys Leu 
            1380                1385                1390        
Met Gly Ser Asn Glu Gly Glu Phe Lys Ala Glu Gly Asn Ser Lys Phe 
        1395                1400                1405            
Thr Tyr Thr Val Leu Glu Asp Gly Cys Thr Lys His Thr Gly Glu Trp 
    1410                1415                1420                
Ser Lys Thr Val Phe Glu Tyr Arg Thr Arg Lys Ala Val Arg Leu Pro 
1425                1430                1435                1440
Ile Val Asp Ile Ala Pro Tyr Asp Ile Gly Gly Pro Asp Gln Glu Phe 
                1445                1450                1455    
Gly Val Asp Val Gly Pro Val Cys Phe Leu 
            1460                1465    

<210> 55
<211> 1411
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..1411
<223> /mol_type="DNA"
      /note="Homo sapiens Oct4/POU5F1"
      /organism="Homo sapiens"

<400> 55
ccttcgcaag ccctcatttc accaggcccc cggcttgggg cgccttcctt ccccatggcg      60

ggacacctgg cttcggattt cgccttctcg ccccctccag gtggtggagg tgatgggcca     120

ggggggccgg agccgggctg ggttgatcct cggacctggc taagcttcca aggccctcct     180

ggagggccag gaatcgggcc gggggttggg ccaggctctg aggtgtgggg gattccccca     240

tgccccccgc cgtatgagtt ctgtgggggg atggcgtact gtgggcccca ggttggagtg     300

gggctagtgc cccaaggcgg cttggagacc tctcagcctg agggcgaagc aggagtcggg     360

gtggagagca actccgatgg ggcctccccg gagccctgca ccgtcacccc tggtgccgtg     420

aagctggaga aggagaagct ggagcaaaac ccggaggagt cccaggacat caaagctctg     480

cagaaagaac tcgagcaatt tgccaagctc ctgaagcaga agaggatcac cctgggatat     540

acacaggccg atgtggggct caccctgggg gttctatttg ggaaggtatt cagccaaacg     600

accatctgcc gctttgaggc tctgcagctt agcttcaaga acatgtgtaa gctgcggccc     660

ttgctgcaga agtgggtgga ggaagctgac aacaatgaaa atcttcagga gatatgcaaa     720

gcagaaaccc tcgtgcaggc ccgaaagaga aagcgaacca gtatcgagaa ccgagtgaga     780

ggcaacctgg agaatttgtt cctgcagtgc ccgaaaccca cactgcagca gatcagccac     840

atcgcccagc agcttgggct cgagaaggat gtggtccgag tgtggttctg taaccggcgc     900

cagaagggca agcgatcaag cagcgactat gcacaacgag aggattttga ggctgctggg     960

tctcctttct cagggggacc agtgtccttt cctctggccc cagggcccca ttttggtacc    1020

ccaggctatg ggagccctca cttcactgca ctgtactcct cggtcccttt ccctgagggg    1080

gaagcctttc cccctgtctc cgtcaccact ctgggctctc ccatgcattc aaactgaggt    1140

gcctgccctt ctaggaatgg gggacagggg gaggggagga gctagggaaa gaaaacctgg    1200

agtttgtgcc agggtttttg ggattaagtt cttcattcac taaggaagga attgggaaca    1260

caaagggtgg gggcagggga gtttggggca actggttgga gggaaggtga agttcaatga    1320

tgctcttgat tttaatccca catcatgtat cacttttttc ttaaataaag aagcctggga    1380

cacagtagat agacacactt aaaaaaaaaa a                                   1411


<210> 56
<211> 360
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..360
<223> /mol_type="protein"
      /note="Homo sapiens Oct4/POU5F1"
      /organism="Homo sapiens"

<400> 56
Met Ala Gly His Leu Ala Ser Asp Phe Ala Phe Ser Pro Pro Pro Gly 
1               5                   10                   15    
Gly Gly Gly Asp Gly Pro Gly Gly Pro Glu Pro Gly Trp Val Asp Pro 
            20                   25                  30        
Arg Thr Trp Leu Ser Phe Gln Gly Pro Pro Gly Gly Pro Gly Ile Gly 
        35                   40                  45            
Pro Gly Val Gly Pro Gly Ser Glu Val Trp Gly Ile Pro Pro Cys Pro 
    50                   55                  60                
Pro Pro Tyr Glu Phe Cys Gly Gly Met Ala Tyr Cys Gly Pro Gln Val 
65                   70                  75                  80
Gly Val Gly Leu Val Pro Gln Gly Gly Leu Glu Thr Ser Gln Pro Glu 
                85                   90                  95    
Gly Glu Ala Gly Val Gly Val Glu Ser Asn Ser Asp Gly Ala Ser Pro 
            100                  105                110        
Glu Pro Cys Thr Val Thr Pro Gly Ala Val Lys Leu Glu Lys Glu Lys 
        115                  120                125            
Leu Glu Gln Asn Pro Glu Glu Ser Gln Asp Ile Lys Ala Leu Gln Lys 
    130                  135                140                
Glu Leu Glu Gln Phe Ala Lys Leu Leu Lys Gln Lys Arg Ile Thr Leu 
145                  150                155                  160
Gly Tyr Thr Gln Ala Asp Val Gly Leu Thr Leu Gly Val Leu Phe Gly 
                165                  170                175    
Lys Val Phe Ser Gln Thr Thr Ile Cys Arg Phe Glu Ala Leu Gln Leu 
            180                  185                190        
Ser Phe Lys Asn Met Cys Lys Leu Arg Pro Leu Leu Gln Lys Trp Val 
        195                  200                205            
Glu Glu Ala Asp Asn Asn Glu Asn Leu Gln Glu Ile Cys Lys Ala Glu 
    210                  215                220                
Thr Leu Val Gln Ala Arg Lys Arg Lys Arg Thr Ser Ile Glu Asn Arg 
225                  230                235                  240
Val Arg Gly Asn Leu Glu Asn Leu Phe Leu Gln Cys Pro Lys Pro Thr 
                245                  250                255    
Leu Gln Gln Ile Ser His Ile Ala Gln Gln Leu Gly Leu Glu Lys Asp 
            260                  265                270        
Val Val Arg Val Trp Phe Cys Asn Arg Arg Gln Lys Gly Lys Arg Ser 
        275                  280                285            
Ser Ser Asp Tyr Ala Gln Arg Glu Asp Phe Glu Ala Ala Gly Ser Pro 
    290                  295                300                
Phe Ser Gly Gly Pro Val Ser Phe Pro Leu Ala Pro Gly Pro His Phe 
305                  310                315                  320
Gly Thr Pro Gly Tyr Gly Ser Pro His Phe Thr Ala Leu Tyr Ser Ser 
                325                  330                335    
Val Pro Phe Pro Glu Gly Glu Ala Phe Pro Pro Val Ser Val Thr Thr 
            340                  345                350        
Leu Gly Ser Pro Met His Ser Asn 
        355                  360

<210> 57
<211> 3897
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..3897
<223> /mol_type="DNA"
      /note="Homo sapiens Galc"
      /organism="Homo sapiens"

<400> 57
actcaaaatg gcggcggcgg cgtcagcatc agcggcctcc tgcccgtatc tatcgtggcg       60

gcgacgggac ccgcctccct gggcgccgga gtcatgtgac ccacacaatg gctgagtggc      120

tactctcggc ttcctggcaa cgccgagcga aagctatgac tgcggccgcg ggttcggcgg      180

gccgcgccgc ggtgcccttg ctgctgtgtg cgctgctggc gcccggcggc gcgtacgtgc      240

tcgacgactc cgacgggctg ggccgggagt tcgacggcat cggcgcggtc agcggcggcg      300

gggcaacctc ccgacttcta gtaaattacc cagagcccta tcgttctcag atattggatt      360

atctctttaa gccgaatttt ggtgcctctt tgcatatttt aaaagtggaa ataggtggtg      420

atgggcagac aacagacggc actgagccct cccacatgca ttatgcacta gatgagaatt      480

atttccgagg atacgagtgg tggttgatga aagaagctaa gaagaggaat cccaatatta      540

cactcattgg gttgccatgg tcattccctg gatggctggg aaaaggtttc gactggcctt      600

atgtcaatct tcagctgact gcctattatg tcgtgacctg gattgtgggc gccaagcgtt      660

accatgattt ggacattgat tatattggaa tttggaatga gaggtcatat aatgccaatt      720

atattaagat attaagaaaa atgctgaatt atcaaggtct ccagcgagtg aaaatcatag      780

caagtgataa tctctgggag tccatctctg catccatgct ccttgatgcc gaactcttca      840

aggtggttga tgttataggg gctcattatc ctggaaccca ttcagcaaaa gatgcaaagt      900

tgactgggaa gaagctttgg tcttctgaag actttagcac tttaaatagt gacatgggtg      960

caggctgctg gggtcgcatt ttaaatcaga attatatcaa tggctatatg acttccacaa     1020

tcgcatggaa tttagtggct agttactatg aacagttgcc ttatgggaga tgcgggttga     1080

tgacggccca ggagccatgg agtgggcact acgtggtaga atctcctgtc tgggtatcag     1140

ctcataccac tcagtttact caacctggct ggtattacct gaagacagtt ggccatttag     1200

agaaaggagg aagctacgta gctctgactg atggcttagg gaacctcacc atcatcattg     1260

aaaccatgag tcataaacat tctaagtgca tacggccatt tcttccttat ttcaatgtgt     1320

cacaacaatt tgccaccttt gttcttaagg gatcttttag tgaaatacca gagctacagg     1380

tatggtatac caaacttgga aaaacatccg aaagatttct ttttaagcag ctggattctc     1440

tatggctcct tgacagcgat ggcagtttca cactgagcct gcatgaagat gagctgttca     1500

cactcaccac tctcaccact ggtcgcaaag gcagctaccc gcttcctcca aaatcccagc     1560

ccttcccaag tacctataag gatgatttca atgttgatta cccatttttt agtgaagctc     1620

caaactttgc tgatcaaact ggtgtatttg aatattttac aaatattgaa gaccctggcg     1680

agcatcactt cacgctacgc caagttctca accagagacc cattacgtgg gctgccgatg     1740

catccaacac aatcagtatt ataggagact acaactggac caatctgact ataaagtgtg     1800

atgtatacat agagacccct gacacaggag gtgtgttcat tgcaggaaga gtaaataaag     1860

gtggtatttt gattagaagt gccagaggaa ttttcttctg gatttttgca aatggatctt     1920

acagggttac aggtgattta gctggatgga ttatatatgc tttaggacgt gttgaagtta     1980

cagcaaaaaa atggtataca ctcacgttaa ctattaaggg tcatttcacc tctggcatgc     2040

tgaatgacaa gtctctgtgg acagacatcc ctgtgaattt tccaaagaat ggctgggctg     2100

caattggaac tcactccttt gaatttgcac agtttgacaa ctttcttgtg gaagccacac     2160

gctaatactt aacagggcat catagaatac tctggatttt cttcccttct ttttggtttt     2220

ggttcagagc caattcttgt ttcattggaa cagtatatga ggcttttgag actaaaaata     2280

atgaagagta aaaggggaga gaaatttatt tttaatttac cctgtggaag attttattag     2340

aattaattcc aaggggaaaa ctggtgaatc tttaacatta cctggtgtgt tccctaacat     2400

tcaaactgtg cattggccat acccttagga gtggtttgag tagtacagac ctcgaagcct     2460

tgctgctaac actgaggtag ctctcttcat cttatttgca agcggtcctg tagatggcag     2520

taacttgatc atcactgaga tgtatttatg catgctgacc gtgtgtccaa gtgagccagt     2580

gtcttcatca caagatgatg ctgccataat agaaagctga agaacactag aagtagcttt     2640

ttgaaaacca cttcaacctg ttatgcttta tgctctaaaa agtatttttt tattttcctt     2700

tttaagatga tacttttgaa atgcaggata tgatgagtgg gatgatttta aaaatgcctc     2760

tttaataaac tacctctaac actatttctg cagtaataga tattagcaga ttaattgggt     2820

tatttgcatt atttaatttt tttgattcca agttttggtc ttgtaaccac tataactctc     2880

tgtgaacgtt tttccaggtg gctggaagaa ggaagaaaac ctgatatagc caatgctgtt     2940

gtagtcgttt cctcagcctc atctcactgt gctgtggtct gtcctcacat gtgcactggt     3000

aacagactca cacagctgat gaatgctttt ctctccttat gtgtggaagg aggggagcac     3060

ttagacattt gctaactccc agaattggat catctcctaa gatgtactta ctttttaaag     3120

tccaaatatg tttatattta aatatacgtg agcgtgttca tcatgttgta tgatttatac     3180

taagcattaa tgtggctcta tgtagcaaat cagttattca tgtaggtaaa gtaaatctag     3240

aattatttat aagaattact cattgaacta attctactat ttaggaattt gtaagagtct     3300

aacataggct tagctacagt gaagttttgc attgcttttg aagacaagaa gataagtgct     3360

agaataaata agattacaga gaaaattttt tgttaaaacc aagtgatttc cagctgatgt     3420

atctaatatt ttttaaaacg aacattatag aggtgtaatt tatttacaat aaaatgttcc     3480

tactttaaat atacaattca gtgagttttg ataaattgat atacccatgt aaccaacact     3540

ccagtcaagc ttcagaatat ttccatcacc ccagaaggtt ctcttgtata cctgctcagt     3600

cagttccttt cactcccaat tgttggcagc cattgatagg aattctatca ctataggtta     3660

gttttctttg ttccagaaca tcatgaaagc ggcgtcatgt actgtgtatt cttatgaatg     3720

gtttctttcc atcagcataa tgatttgaga tttgtccatg ttgtgtgatt cagtggtttg     3780

ttccttctta tttctgaaga gttttccatt gtatgaatat accacaattt gtttcctccc     3840

caccagtttc tgatactaca attaaaactg tctacattta caaaaaaaaa aaaaaaa        3897


<210> 58
<211> 685
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..685
<223> /mol_type="protein"
      /note="Homo sapiens Galc"
      /organism="Homo sapiens"

<400> 58
Met Ala Glu Trp Leu Leu Ser Ala Ser Trp Gln Arg Arg Ala Lys Ala 
1               5                   10                   15    
Met Thr Ala Ala Ala Gly Ser Ala Gly Arg Ala Ala Val Pro Leu Leu 
            20                   25                  30        
Leu Cys Ala Leu Leu Ala Pro Gly Gly Ala Tyr Val Leu Asp Asp Ser 
        35                   40                  45            
Asp Gly Leu Gly Arg Glu Phe Asp Gly Ile Gly Ala Val Ser Gly Gly 
    50                   55                  60                
Gly Ala Thr Ser Arg Leu Leu Val Asn Tyr Pro Glu Pro Tyr Arg Ser 
65                   70                  75                  80
Gln Ile Leu Asp Tyr Leu Phe Lys Pro Asn Phe Gly Ala Ser Leu His 
                85                   90                  95    
Ile Leu Lys Val Glu Ile Gly Gly Asp Gly Gln Thr Thr Asp Gly Thr 
            100                  105                110        
Glu Pro Ser His Met His Tyr Ala Leu Asp Glu Asn Tyr Phe Arg Gly 
        115                  120                125            
Tyr Glu Trp Trp Leu Met Lys Glu Ala Lys Lys Arg Asn Pro Asn Ile 
    130                  135                140                
Thr Leu Ile Gly Leu Pro Trp Ser Phe Pro Gly Trp Leu Gly Lys Gly 
145                  150                155                  160
Phe Asp Trp Pro Tyr Val Asn Leu Gln Leu Thr Ala Tyr Tyr Val Val 
                165                  170                175    
Thr Trp Ile Val Gly Ala Lys Arg Tyr His Asp Leu Asp Ile Asp Tyr 
            180                  185                190        
Ile Gly Ile Trp Asn Glu Arg Ser Tyr Asn Ala Asn Tyr Ile Lys Ile 
        195                  200                205            
Leu Arg Lys Met Leu Asn Tyr Gln Gly Leu Gln Arg Val Lys Ile Ile 
    210                  215                220                
Ala Ser Asp Asn Leu Trp Glu Ser Ile Ser Ala Ser Met Leu Leu Asp 
225                  230                235                  240
Ala Glu Leu Phe Lys Val Val Asp Val Ile Gly Ala His Tyr Pro Gly 
                245                  250                255    
Thr His Ser Ala Lys Asp Ala Lys Leu Thr Gly Lys Lys Leu Trp Ser 
            260                  265                270        
Ser Glu Asp Phe Ser Thr Leu Asn Ser Asp Met Gly Ala Gly Cys Trp 
        275                  280                285            
Gly Arg Ile Leu Asn Gln Asn Tyr Ile Asn Gly Tyr Met Thr Ser Thr 
    290                  295                300                
Ile Ala Trp Asn Leu Val Ala Ser Tyr Tyr Glu Gln Leu Pro Tyr Gly 
305                  310                315                  320
Arg Cys Gly Leu Met Thr Ala Gln Glu Pro Trp Ser Gly His Tyr Val 
                325                  330                335    
Val Glu Ser Pro Val Trp Val Ser Ala His Thr Thr Gln Phe Thr Gln 
            340                  345                350        
Pro Gly Trp Tyr Tyr Leu Lys Thr Val Gly His Leu Glu Lys Gly Gly 
        355                  360                365            
Ser Tyr Val Ala Leu Thr Asp Gly Leu Gly Asn Leu Thr Ile Ile Ile 
    370                  375                380                
Glu Thr Met Ser His Lys His Ser Lys Cys Ile Arg Pro Phe Leu Pro 
385                  390                395                  400
Tyr Phe Asn Val Ser Gln Gln Phe Ala Thr Phe Val Leu Lys Gly Ser 
                405                  410                415    
Phe Ser Glu Ile Pro Glu Leu Gln Val Trp Tyr Thr Lys Leu Gly Lys 
            420                  425                430        
Thr Ser Glu Arg Phe Leu Phe Lys Gln Leu Asp Ser Leu Trp Leu Leu 
        435                  440                445            
Asp Ser Asp Gly Ser Phe Thr Leu Ser Leu His Glu Asp Glu Leu Phe 
    450                  455                460                
Thr Leu Thr Thr Leu Thr Thr Gly Arg Lys Gly Ser Tyr Pro Leu Pro 
465                  470                475                  480
Pro Lys Ser Gln Pro Phe Pro Ser Thr Tyr Lys Asp Asp Phe Asn Val 
                485                  490                495    
Asp Tyr Pro Phe Phe Ser Glu Ala Pro Asn Phe Ala Asp Gln Thr Gly 
            500                  505                510        
Val Phe Glu Tyr Phe Thr Asn Ile Glu Asp Pro Gly Glu His His Phe 
        515                  520                525            
Thr Leu Arg Gln Val Leu Asn Gln Arg Pro Ile Thr Trp Ala Ala Asp 
    530                  535                540                
Ala Ser Asn Thr Ile Ser Ile Ile Gly Asp Tyr Asn Trp Thr Asn Leu 
545                  550                555                  560
Thr Ile Lys Cys Asp Val Tyr Ile Glu Thr Pro Asp Thr Gly Gly Val 
                565                  570                575    
Phe Ile Ala Gly Arg Val Asn Lys Gly Gly Ile Leu Ile Arg Ser Ala 
            580                  585                590        
Arg Gly Ile Phe Phe Trp Ile Phe Ala Asn Gly Ser Tyr Arg Val Thr 
        595                  600                605            
Gly Asp Leu Ala Gly Trp Ile Ile Tyr Ala Leu Gly Arg Val Glu Val 
    610                  615                620                
Thr Ala Lys Lys Trp Tyr Thr Leu Thr Leu Thr Ile Lys Gly His Phe 
625                  630                635                  640
Thr Ser Gly Met Leu Asn Asp Lys Ser Leu Trp Thr Asp Ile Pro Val 
                645                  650                655    
Asn Phe Pro Lys Asn Gly Trp Ala Ala Ile Gly Thr His Ser Phe Glu 
            660                  665                670        
Phe Ala Gln Phe Asp Asn Phe Leu Val Glu Ala Thr Arg 
        675                  680                685

<210> 59
<211> 606
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..606
<223> /mol_type="DNA"
      /note="Homo sapiens Scleraxis A and Scleraxis B"
      /organism="Homo sapiens"

<400> 59
atgtccttcg ccacgctgcg cccggcgccg ccgggccgct acctgtaccc cgaggtgagc      60

ccgctgtcgg aggacgagga ccgcggcagc gacagctcgg gctccgacga gaaaccctgt     120

cgcgtgcacg cggcgcgctg cggcctccag ggcgcccggc ggagggcggg gggccggcgg     180

gccgggggcg gggggccagg gggccggcca ggccgtgagc cccggcagcg gcacacggcg     240

aacgcgcgcg agcgagaccg caccaacagc gtgaacacgg ccttcacggc gctgcgcacg     300

ctgatcccca ccgagcccgc cgaccgcaag ctctccaaga ttgagacgct gcgcctggcc     360

tccagctaca tctcgcacct gggcaacgtg ctgctggcgg gcgaggcctg cggcgacgga     420

cagccctgcc actccgggcc cgccttcttc cacgcggcgc gcgccggcag ccccccgccg     480

ccgcccccgc cgcctcccgc ccgcgacggc gagaacaccc agcccaaaca gatctgcacc     540

ttctgcctca gcaaccagag aaagttgagc aaggaccgcg acagaaagac agcgattcgc     600

agttag                                                                606


<210> 60
<211> 201
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..201
<223> /mol_type="protein"
      /note="Homo sapiens Scleraxis A and Scleraxis B"
      /organism="Homo sapiens"

<400> 60
Met Ser Phe Ala Thr Leu Arg Pro Ala Pro Pro Gly Arg Tyr Leu Tyr 
1               5                   10                   15    
Pro Glu Val Ser Pro Leu Ser Glu Asp Glu Asp Arg Gly Ser Asp Ser 
            20                   25                  30        
Ser Gly Ser Asp Glu Lys Pro Cys Arg Val His Ala Ala Arg Cys Gly 
        35                   40                  45            
Leu Gln Gly Ala Arg Arg Arg Ala Gly Gly Arg Arg Ala Gly Gly Gly 
    50                   55                  60                
Gly Pro Gly Gly Arg Pro Gly Arg Glu Pro Arg Gln Arg His Thr Ala 
65                   70                  75                  80
Asn Ala Arg Glu Arg Asp Arg Thr Asn Ser Val Asn Thr Ala Phe Thr 
                85                   90                  95    
Ala Leu Arg Thr Leu Ile Pro Thr Glu Pro Ala Asp Arg Lys Leu Ser 
            100                  105                110        
Lys Ile Glu Thr Leu Arg Leu Ala Ser Ser Tyr Ile Ser His Leu Gly 
        115                  120                125            
Asn Val Leu Leu Ala Gly Glu Ala Cys Gly Asp Gly Gln Pro Cys His 
    130                  135                140                
Ser Gly Pro Ala Phe Phe His Ala Ala Arg Ala Gly Ser Pro Pro Pro 
145                  150                155                  160
Pro Pro Pro Pro Pro Pro Ala Arg Asp Gly Glu Asn Thr Gln Pro Lys 
                165                  170                175    
Gln Ile Cys Thr Phe Cys Leu Ser Asn Gln Arg Lys Leu Ser Lys Asp 
            180                  185                190        
Arg Asp Arg Lys Thr Ala Ile Arg Ser 
        195                  200    

<210> 61
<211> 3963
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..3963
<223> /mol_type="DNA"
      /note="Homo sapiens Sox-9"
      /organism="Homo sapiens"

<400> 61
ggagagccga aagcggagct cgaaactgac tggaaacttc agtggcgcgg agactcgcca       60

gtttcaaccc cggaaacttt tctttgcagg aggagaagag aaggggtgca agcgccccca      120

cttttgctct ttttcctccc ctcctcctcc tctccaattc gcctcccccc acttggagcg      180

ggcagctgtg aactggccac cccgcgcctt cctaagtgct cgccgcggta gccggccgac      240

gcgccagctt ccccgggagc cgcttgctcc gcatccgggc agccgagggg agaggagccc      300

gcgcctcgag tccccgagcc gccgcggctt ctcgcctttc ccggccacca gccccctgcc      360

ccgggcccgc gtatgaatct cctggacccc ttcatgaaga tgaccgacga gcaggagaag      420

ggcctgtccg gcgcccccag ccccaccatg tccgaggact ccgcgggctc gccctgcccg      480

tcgggctccg gctcggacac cgagaacacg cggccccagg agaacacgtt ccccaagggc      540

gagcccgatc tgaagaagga gagcgaggag gacaagttcc ccgtgtgcat ccgcgaggcg      600

gtcagccagg tgctcaaagg ctacgactgg acgctggtgc ccatgccggt gcgcgtcaac      660

ggctccagca agaacaagcc gcacgtcaag cggcccatga acgccttcat ggtgtgggcg      720

caggcggcgc gcaggaagct cgcggaccag tacccgcact tgcacaacgc cgagctcagc      780

aagacgctgg gcaagctctg gagacttctg aacgagagcg agaagcggcc cttcgtggag      840

gaggcggagc ggctgcgcgt gcagcacaag aaggaccacc cggattacaa gtaccagccg      900

cggcggagga agtcggtgaa gaacgggcag gcggaggcag aggaggccac ggagcagacg      960

cacatctccc ccaacgccat cttcaaggcg ctgcaggccg actcgccaca ctcctcctcc     1020

ggcatgagcg aggtgcactc ccccggcgag cactcggggc aatcccaggg cccaccgacc     1080

ccacccacca cccccaaaac cgacgtgcag ccgggcaagg ctgacctgaa gcgagagggg     1140

cgccccttgc cagagggggg cagacagccc cctatcgact tccgcgacgt ggacatcggc     1200

gagctgagca gcgacgtcat ctccaacatc gagaccttcg atgtcaacga gtttgaccag     1260

tacctgccgc ccaacggcca cccgggggtg ccggccacgc acggccaggt cacctacacg     1320

ggcagctacg gcatcagcag caccgcggcc accccggcga gcgcgggcca cgtgtggatg     1380

tccaagcagc aggcgccgcc gccacccccg cagcagcccc cacaggcccc gccggccccg     1440

caggcgcccc cgcagccgca ggcggcgccc ccacagcagc cggcggcacc cccgcagcag     1500

ccacaggcgc acacgctgac cacgctgagc agcgagccgg gccagtccca gcgaacgcac     1560

atcaagacgg agcagctgag ccccagccac tacagcgagc agcagcagca ctcgccccaa     1620

cagatcgcct acagcccctt caacctccca cactacagcc cctcctaccc gcccatcacc     1680

cgctcacagt acgactacac cgaccaccag aactccagct cctactacag ccacgcggca     1740

ggccagggca ccggcctcta ctccaccttc acctacatga accccgctca gcgccccatg     1800

tacaccccca tcgccgacac ctctggggtc ccttccatcc cgcagaccca cagcccccag     1860

cactgggaac aacccgtcta cacacagctc actcgacctt gaggaggcct cccacgaagg     1920

gcgaagatgg ccgagatgat cctaaaaata accgaagaaa gagaggacca accagaattc     1980

cctttggaca tttgtgtttt tttgtttttt tattttgttt tgttttttct tcttcttctt     2040

cttccttaaa gacatttaag ctaaaggcaa ctcgtaccca aatttccaag acacaaacat     2100

gacctatcca agcgcattac ccacttgtgg ccaatcagtg gccaggccaa ccttggctaa     2160

atggagcagc gaaatcaacg agaaactgga ctttttaaac cctcttcaga gcaagcgtgg     2220

aggatgatgg agaatcgtgt gatcagtgtg ctaaatctct ctgcctgttt ggactttgta     2280

attatttttt tagcagtaat taaagaaaaa agtcctctgt gaggaatatt ctctatttta     2340

aatattttta gtatgtactg tgtatgattc attaccattt tgaggggatt tatacatatt     2400

tttagataaa attaaatgct cttatttttc caacagctaa actactctta gttgaacagt     2460

gtgccctagc ttttcttgca accagagtat ttttgtacag atttgctttc tcttacaaaa     2520

agaaaaaaaa aatcctgttg tattaacatt taaaaacaga attgtgttat gtgatcagtt     2580

ttgggggtta actttgctta attcctcagg ctttgcgatt taaggaggag ctgccttaaa     2640

aaaaaataaa ggccttattt tgcaattatg ggagtaaaca atagtctaga gaagcatttg     2700

gtaagcttta tcatatatat attttttaaa gaagagaaaa acaccttgag ccttaaaacg     2760

gtgctgctgg gaaacatttg cactctttta gtgcatttcc tcctgccttt gcttgttcac     2820

tgcagtctta agaaagaggt aaaaggcaag caaaggagat gaaatctgtt ctgggaatgt     2880

ttcagcagcc aataagtgcc cgagcacact gcccccggtt gcctgcctgg gccccatgtg     2940

gaaggcagat gcctgctcgc tctgtcacct gtgcctctca gaacaccagc agttaacctt     3000

caagacattc cacttgctaa aattatttat tttgtaagga gaggttttaa ttaaaacaaa     3060

aaaaaattct tttttttttt tttttccaat tttaccttct ttaaaatagg ttgttggagc     3120

tttcctcaaa gggtatggtc atctgttgtt aaattatgtt cttaactgta accagttttt     3180

ttttatttat ctctttaatc tttttttatt attaaaagca agtttctttg tattcctcac     3240

cctagatttg tataaatgcc tttttgtcca tccctttttt ctttgttgtt tttgttgaaa     3300

acaaactgga aacttgtttc tttttttgta taaatgagag attgcaaatg tagtgtatca     3360

ctgagtcatt tgcagtgttt tctgccacag acctttgggc tgccttatat tgtgtgtgtg     3420

tgtgggtgtg tgtgtgtttt gacacaaaaa caatgcaagc atgtgtcatc catatttctc     3480

tgcatcttct cttggagtga gggaggctac ctggagggga tcagcccact gacagacctt     3540

aatcttaatt actgctgtgg ctagagagtt tgaggattgc tttttaaaaa agacagcaaa     3600

cttttttttt tatttaaaaa aagatatatt aacagtttta gaagtcagta gaataaaatc     3660

ttaaagcact cataatatgg catccttcaa tttctgtata aaagcagatc tttttaaaaa     3720

gatacttctg taacttaaga aacctggcat ttaaatcata ttttgtcttt aggtaaaagc     3780

tttggtttgt gttcgtgttt tgtttgtttc acttgtttcc ctcccagccc caaacctttt     3840

gttctctccg tgaaacttac ctttcccttt ttctttctct tttttttttt tgtatattat     3900

tgtttacaat aaatatacat tgcattaaaa agaaaaaaaa aaaaaaaaaa aaaaaaaaaa     3960

aaa                                                                   3963


<210> 62
<211> 509
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..509
<223> /mol_type="protein"
      /note="Homo sapiens Sox-9"
      /organism="Homo sapiens"

<400> 62
Met Asn Leu Leu Asp Pro Phe Met Lys Met Thr Asp Glu Gln Glu Lys 
1               5                   10                   15    
Gly Leu Ser Gly Ala Pro Ser Pro Thr Met Ser Glu Asp Ser Ala Gly 
            20                   25                  30        
Ser Pro Cys Pro Ser Gly Ser Gly Ser Asp Thr Glu Asn Thr Arg Pro 
        35                   40                  45            
Gln Glu Asn Thr Phe Pro Lys Gly Glu Pro Asp Leu Lys Lys Glu Ser 
    50                   55                  60                
Glu Glu Asp Lys Phe Pro Val Cys Ile Arg Glu Ala Val Ser Gln Val 
65                   70                  75                  80
Leu Lys Gly Tyr Asp Trp Thr Leu Val Pro Met Pro Val Arg Val Asn 
                85                   90                  95    
Gly Ser Ser Lys Asn Lys Pro His Val Lys Arg Pro Met Asn Ala Phe 
            100                  105                110        
Met Val Trp Ala Gln Ala Ala Arg Arg Lys Leu Ala Asp Gln Tyr Pro 
        115                  120                125            
His Leu His Asn Ala Glu Leu Ser Lys Thr Leu Gly Lys Leu Trp Arg 
    130                  135                140                
Leu Leu Asn Glu Ser Glu Lys Arg Pro Phe Val Glu Glu Ala Glu Arg 
145                  150                155                  160
Leu Arg Val Gln His Lys Lys Asp His Pro Asp Tyr Lys Tyr Gln Pro 
                165                  170                175    
Arg Arg Arg Lys Ser Val Lys Asn Gly Gln Ala Glu Ala Glu Glu Ala 
            180                  185                190        
Thr Glu Gln Thr His Ile Ser Pro Asn Ala Ile Phe Lys Ala Leu Gln 
        195                  200                205            
Ala Asp Ser Pro His Ser Ser Ser Gly Met Ser Glu Val His Ser Pro 
    210                  215                220                
Gly Glu His Ser Gly Gln Ser Gln Gly Pro Pro Thr Pro Pro Thr Thr 
225                  230                235                  240
Pro Lys Thr Asp Val Gln Pro Gly Lys Ala Asp Leu Lys Arg Glu Gly 
                245                  250                255    
Arg Pro Leu Pro Glu Gly Gly Arg Gln Pro Pro Ile Asp Phe Arg Asp 
            260                  265                270        
Val Asp Ile Gly Glu Leu Ser Ser Asp Val Ile Ser Asn Ile Glu Thr 
        275                  280                285            
Phe Asp Val Asn Glu Phe Asp Gln Tyr Leu Pro Pro Asn Gly His Pro 
    290                  295                300                
Gly Val Pro Ala Thr His Gly Gln Val Thr Tyr Thr Gly Ser Tyr Gly 
305                  310                315                  320
Ile Ser Ser Thr Ala Ala Thr Pro Ala Ser Ala Gly His Val Trp Met 
                325                  330                335    
Ser Lys Gln Gln Ala Pro Pro Pro Pro Pro Gln Gln Pro Pro Gln Ala 
            340                  345                350        
Pro Pro Ala Pro Gln Ala Pro Pro Gln Pro Gln Ala Ala Pro Pro Gln 
        355                  360                365            
Gln Pro Ala Ala Pro Pro Gln Gln Pro Gln Ala His Thr Leu Thr Thr 
    370                  375                380                
Leu Ser Ser Glu Pro Gly Gln Ser Gln Arg Thr His Ile Lys Thr Glu 
385                  390                395                  400
Gln Leu Ser Pro Ser His Tyr Ser Glu Gln Gln Gln His Ser Pro Gln 
                405                  410                415    
Gln Ile Ala Tyr Ser Pro Phe Asn Leu Pro His Tyr Ser Pro Ser Tyr 
            420                  425                430        
Pro Pro Ile Thr Arg Ser Gln Tyr Asp Tyr Thr Asp His Gln Asn Ser 
        435                  440                445            
Ser Ser Tyr Tyr Ser His Ala Ala Gly Gln Gly Thr Gly Leu Tyr Ser 
    450                  455                460                
Thr Phe Thr Tyr Met Asn Pro Ala Gln Arg Pro Met Tyr Thr Pro Ile 
465                  470                475                  480
Ala Asp Thr Ser Gly Val Pro Ser Ile Pro Gln Thr His Ser Pro Gln 
                485                  490                495    
His Trp Glu Gln Pro Val Tyr Thr Gln Leu Thr Arg Pro 
            500                  505                

<210> 63
<211> 2379
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..2379
<223> /mol_type="DNA"
      /note="Homo sapiens c-Myc"
      /organism="Homo sapiens"

<400> 63
gacccccgag ctgtgctgct cgcggccgcc accgccgggc cccggccgtc cctggctccc      60

ctcctgcctc gagaagggca gggcttctca gaggcttggc gggaaaaaga acggagggag     120

ggatcgcgct gagtataaaa gccggttttc ggggctttat ctaactcgct gtagtaattc     180

cagcgagagg cagagggagc gagcgggcgg ccggctaggg tggaagagcc gggcgagcag     240

agctgcgctg cgggcgtcct gggaagggag atccggagcg aatagggggc ttcgcctctg     300

gcccagccct cccgctgatc ccccagccag cggtccgcaa cccttgccgc atccacgaaa     360

ctttgcccat agcagcgggc gggcactttg cactggaact tacaacaccc gagcaaggac     420

gcgactctcc cgacgcgggg aggctattct gcccatttgg ggacacttcc ccgccgctgc     480

caggacccgc ttctctgaaa ggctctcctt gcagctgctt agacgctgga tttttttcgg     540

gtagtggaaa accagcagcc tcccgcgacg atgcccctca acgttagctt caccaacagg     600

aactatgacc tcgactacga ctcggtgcag ccgtatttct actgcgacga ggaggagaac     660

ttctaccagc agcagcagca gagcgagctg cagcccccgg cgcccagcga ggatatctgg     720

aagaaattcg agctgctgcc caccccgccc ctgtccccta gccgccgctc cgggctctgc     780

tcgccctcct acgttgcggt cacacccttc tcccttcggg gagacaacga cggcggtggc     840

gggagcttct ccacggccga ccagctggag atggtgaccg agctgctggg aggagacatg     900

gtgaaccaga gtttcatctg cgacccggac gacgagacct tcatcaaaaa catcatcatc     960

caggactgta tgtggagcgg cttctcggcc gccgccaagc tcgtctcaga gaagctggcc    1020

tcctaccagg ctgcgcgcaa agacagcggc agcccgaacc ccgcccgcgg ccacagcgtc    1080

tgctccacct ccagcttgta cctgcaggat ctgagcgccg ccgcctcaga gtgcatcgac    1140

ccctcggtgg tcttccccta ccctctcaac gacagcagct cgcccaagtc ctgcgcctcg    1200

caagactcca gcgccttctc tccgtcctcg gattctctgc tctcctcgac ggagtcctcc    1260

ccgcagggca gccccgagcc cctggtgctc catgaggaga caccgcccac caccagcagc    1320

gactctgagg aggaacaaga agatgaggaa gaaatcgatg ttgtttctgt ggaaaagagg    1380

caggctcctg gcaaaaggtc agagtctgga tcaccttctg ctggaggcca cagcaaacct    1440

cctcacagcc cactggtcct caagaggtgc cacgtctcca cacatcagca caactacgca    1500

gcgcctccct ccactcggaa ggactatcct gctgccaaga gggtcaagtt ggacagtgtc    1560

agagtcctga gacagatcag caacaaccga aaatgcacca gccccaggtc ctcggacacc    1620

gaggagaatg tcaagaggcg aacacacaac gtcttggagc gccagaggag gaacgagcta    1680

aaacggagct tttttgccct gcgtgaccag atcccggagt tggaaaacaa tgaaaaggcc    1740

cccaaggtag ttatccttaa aaaagccaca gcatacatcc tgtccgtcca agcagaggag    1800

caaaagctca tttctgaaga ggacttgttg cggaaacgac gagaacagtt gaaacacaaa    1860

cttgaacagc tacggaactc ttgtgcgtaa ggaaaagtaa ggaaaacgat tccttctaac    1920

agaaatgtcc tgagcaatca cctatgaact tgtttcaaat gcatgatcaa atgcaacctc    1980

acaaccttgg ctgagtcttg agactgaaag atttagccat aatgtaaact gcctcaaatt    2040

ggactttggg cataaaagaa cttttttatg cttaccatct tttttttttc tttaacagat    2100

ttgtatttaa gaattgtttt taaaaaattt taagatttac acaatgtttc tctgtaaata    2160

ttgccattaa atgtaaataa ctttaataaa acgtttatag cagttacaca gaatttcaat    2220

cctagtatat agtacctagt attataggta ctataaaccc taattttttt tatttaagta    2280

cattttgctt tttaaagttg atttttttct attgttttta gaaaaaataa aataactggc    2340

aaatatatca ttgagccaaa tcttaaaaaa aaaaaaaaa                           2379


<210> 64
<211> 454
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..454
<223> /mol_type="protein"
      /note="Homo sapiens c-Myc"
      /organism="Homo sapiens"

<400> 64
Met Asp Phe Phe Arg Val Val Glu Asn Gln Gln Pro Pro Ala Thr Met 
1               5                   10                   15    
Pro Leu Asn Val Ser Phe Thr Asn Arg Asn Tyr Asp Leu Asp Tyr Asp 
            20                   25                  30        
Ser Val Gln Pro Tyr Phe Tyr Cys Asp Glu Glu Glu Asn Phe Tyr Gln 
        35                   40                  45            
Gln Gln Gln Gln Ser Glu Leu Gln Pro Pro Ala Pro Ser Glu Asp Ile 
    50                   55                  60                
Trp Lys Lys Phe Glu Leu Leu Pro Thr Pro Pro Leu Ser Pro Ser Arg 
65                   70                  75                  80
Arg Ser Gly Leu Cys Ser Pro Ser Tyr Val Ala Val Thr Pro Phe Ser 
                85                   90                  95    
Leu Arg Gly Asp Asn Asp Gly Gly Gly Gly Ser Phe Ser Thr Ala Asp 
            100                  105                110        
Gln Leu Glu Met Val Thr Glu Leu Leu Gly Gly Asp Met Val Asn Gln 
        115                  120                125            
Ser Phe Ile Cys Asp Pro Asp Asp Glu Thr Phe Ile Lys Asn Ile Ile 
    130                  135                140                
Ile Gln Asp Cys Met Trp Ser Gly Phe Ser Ala Ala Ala Lys Leu Val 
145                  150                155                  160
Ser Glu Lys Leu Ala Ser Tyr Gln Ala Ala Arg Lys Asp Ser Gly Ser 
                165                  170                175    
Pro Asn Pro Ala Arg Gly His Ser Val Cys Ser Thr Ser Ser Leu Tyr 
            180                  185                190        
Leu Gln Asp Leu Ser Ala Ala Ala Ser Glu Cys Ile Asp Pro Ser Val 
        195                  200                205            
Val Phe Pro Tyr Pro Leu Asn Asp Ser Ser Ser Pro Lys Ser Cys Ala 
    210                  215                220                
Ser Gln Asp Ser Ser Ala Phe Ser Pro Ser Ser Asp Ser Leu Leu Ser 
225                  230                235                  240
Ser Thr Glu Ser Ser Pro Gln Gly Ser Pro Glu Pro Leu Val Leu His 
                245                  250                255    
Glu Glu Thr Pro Pro Thr Thr Ser Ser Asp Ser Glu Glu Glu Gln Glu 
            260                  265                270        
Asp Glu Glu Glu Ile Asp Val Val Ser Val Glu Lys Arg Gln Ala Pro 
        275                  280                285            
Gly Lys Arg Ser Glu Ser Gly Ser Pro Ser Ala Gly Gly His Ser Lys 
    290                  295                300                
Pro Pro His Ser Pro Leu Val Leu Lys Arg Cys His Val Ser Thr His 
305                  310                315                  320
Gln His Asn Tyr Ala Ala Pro Pro Ser Thr Arg Lys Asp Tyr Pro Ala 
                325                  330                335    
Ala Lys Arg Val Lys Leu Asp Ser Val Arg Val Leu Arg Gln Ile Ser 
            340                  345                350        
Asn Asn Arg Lys Cys Thr Ser Pro Arg Ser Ser Asp Thr Glu Glu Asn 
        355                  360                365            
Val Lys Arg Arg Thr His Asn Val Leu Glu Arg Gln Arg Arg Asn Glu 
    370                  375                380                
Leu Lys Arg Ser Phe Phe Ala Leu Arg Asp Gln Ile Pro Glu Leu Glu 
385                  390                395                  400
Asn Asn Glu Lys Ala Pro Lys Val Val Ile Leu Lys Lys Ala Thr Ala 
                405                  410                415    
Tyr Ile Leu Ser Val Gln Ala Glu Glu Gln Lys Leu Ile Ser Glu Glu 
            420                  425                430        
Asp Leu Leu Arg Lys Arg Arg Glu Gln Leu Lys His Lys Leu Glu Gln 
        435                  440                445            
Leu Arg Asn Ser Cys Ala 
    450                

<210> 65
<211> 2949
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..2949
<223> /mol_type="DNA"
      /note="Homo sapiens Klf-4"
      /organism="Homo sapiens"

<400> 65
agtttcccga ccagagagaa cgaacgtgtc tgcgggcgcg cggggagcag aggcggtggc      60

gggcggcggc ggcaccggga gccgccgagt gaccctcccc cgcccctctg gccccccacc     120

ctcccacccg cccgtggccc gcgcccatgg ccgcgcgcgc tccacacaac tcaccggagt     180

ccgcgccttg cgccgccgac cagttcgcag ctccgcgcca cggcagccag tctcacctgg     240

cggcaccgcc cgcccaccgc cccggccaca gcccctgcgc ccacggcagc actcgaggcg     300

accgcgacag tggtggggga cgctgctgag tggaagagag cgcagcccgg ccaccggacc     360

tacttactcg ccttgctgat tgtctatttt tgcgtttaca acttttctaa gaacttttgt     420

atacaaagga actttttaaa aaagacgctt ccaagttata tttaatccaa agaagaagga     480

tctcggccaa tttggggttt tgggttttgg cttcgtttct tctcttcgtt gactttgggg     540

ttcaggtgcc ccagctgctt cgggctgccg aggaccttct gggcccccac attaatgagg     600

cagccacctg gcgagtctga catggctgtc agcgacgcgc tgctcccatc tttctccacg     660

ttcgcgtctg gcccggcggg aagggagaag acactgcgtc aagcaggtgc cccgaataac     720

cgctggcggg aggagctctc ccacatgaag cgacttcccc cagtgcttcc cggccgcccc     780

tatgacctgg cggcggcgac cgtggccaca gacctggaga gcggcggagc cggtgcggct     840

tgcggcggta gcaacctggc gcccctacct cggagagaga ccgaggagtt caacgatctc     900

ctggacctgg actttattct ctccaattcg ctgacccatc ctccggagtc agtggccgcc     960

accgtgtcct cgtcagcgtc agcctcctct tcgtcgtcgc cgtcgagcag cggccctgcc    1020

agcgcgccct ccacctgcag cttcacctat ccgatccggg ccgggaacga cccgggcgtg    1080

gcgccgggcg gcacgggcgg aggcctcctc tatggcaggg agtccgctcc ccctccgacg    1140

gctcccttca acctggcgga catcaacgac gtgagcccct cgggcggctt cgtggccgag    1200

ctcctgcggc cagaattgga cccggtgtac attccgccgc agcagccgca gccgccaggt    1260

ggcgggctga tgggcaagtt cgtgctgaag gcgtcgctga gcgcccctgg cagcgagtac    1320

ggcagcccgt cggtcatcag cgtcagcaaa ggcagccctg acggcagcca cccggtggtg    1380

gtggcgccct acaacggcgg gccgccgcgc acgtgcccca agatcaagca ggaggcggtc    1440

tcttcgtgca cccacttggg cgctggaccc cctctcagca atggccaccg gccggctgca    1500

cacgacttcc ccctggggcg gcagctcccc agcaggacta ccccgaccct gggtcttgag    1560

gaagtgctga gcagcaggga ctgtcaccct gccctgccgc ttcctcccgg cttccatccc    1620

cacccggggc ccaattaccc atccttcctg cccgatcaga tgcagccgca agtcccgccg    1680

ctccattacc aagagctcat gccacccggt tcctgcatgc cagaggagcc caagccaaag    1740

aggggaagac gatcgtggcc ccggaaaagg accgccaccc acacttgtga ttacgcgggc    1800

tgcggcaaaa cctacacaaa gagttcccat ctcaaggcac acctgcgaac ccacacaggt    1860

gagaaacctt accactgtga ctgggacggc tgtggatgga aattcgcccg ctcagatgaa    1920

ctgaccaggc actaccgtaa acacacgggg caccgcccgt tccagtgcca aaaatgcgac    1980

cgagcatttt ccaggtcgga ccacctcgcc ttacacatga agaggcattt ttaaatccca    2040

gacagtggat atgacccaca ctgccagaag agaattcagt attttttact tttcacactg    2100

tcttcccgat gagggaagga gcccagccag aaagcactac aatcatggtc aagttcccaa    2160

ctgagtcatc ttgtgagtgg ataatcagga aaaatgagga atccaaaaga caaaaatcaa    2220

agaacagatg gggtctgtga ctggatcttc tatcattcca attctaaatc cgacttgaat    2280

attcctggac ttacaaaatg ccaagggggt gactggaagt tgtggatatc agggtataaa    2340

ttatatccgt gagttggggg agggaagacc agaattccct tgaattgtgt attgatgcaa    2400

tataagcata aaagatcacc ttgtattctc tttaccttct aaaagccatt attatgatgt    2460

tagaagaaga ggaagaaatt caggtacaga aaacatgttt aaatagccta aatgatggtg    2520

cttggtgagt cttggttcta aaggtaccaa acaaggaagc caaagttttc aaactgctgc    2580

atactttgac aaggaaaatc tatatttgtc ttccgatcaa catttatgac ctaagtcagg    2640

taatatacct ggtttacttc tttagcattt ttatgcagac agtctgttat gcactgtggt    2700

ttcagatgtg caataatttg tacaatggtt tattcccaag tatgccttaa gcagaacaaa    2760

tgtgtttttc tatatagttc cttgccttaa taaatatgta atataaattt aagcaaacgt    2820

ctattttgta tatttgtaaa ctacaaagta aaatgaacat tttgtggagt ttgtattttg    2880

catactcaag gtgagaatta agttttaaat aaacctataa tattttatct gaaaaaaaaa    2940

aaaaaaaaa                                                            2949


<210> 66
<211> 478
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..478
<223> /mol_type="protein"
      /note="Homo sapiens Klf-4"
      /organism="Homo sapiens"

<400> 66
Met Arg Gln Pro Pro Gly Glu Ser Asp Met Ala Val Ser Asp Ala Leu 
1               5                   10                   15    
Leu Pro Ser Phe Ser Thr Phe Ala Ser Gly Pro Ala Gly Arg Glu Lys 
            20                   25                  30        
Thr Leu Arg Gln Ala Gly Ala Pro Asn Asn Arg Trp Arg Glu Glu Leu 
        35                   40                  45            
Ser His Met Lys Arg Leu Pro Pro Val Leu Pro Gly Arg Pro Tyr Asp 
    50                   55                  60                
Leu Ala Ala Ala Thr Val Ala Thr Asp Leu Glu Ser Gly Gly Ala Gly 
65                   70                  75                  80
Ala Ala Cys Gly Gly Ser Asn Leu Ala Pro Leu Pro Arg Arg Glu Thr 
                85                   90                  95    
Glu Glu Phe Asn Asp Leu Leu Asp Leu Asp Phe Ile Leu Ser Asn Ser 
            100                  105                110        
Leu Thr His Pro Pro Glu Ser Val Ala Ala Thr Val Ser Ser Ser Ala 
        115                  120                125            
Ser Ala Ser Ser Ser Ser Ser Pro Ser Ser Ser Gly Pro Ala Ser Ala 
    130                  135                140                
Pro Ser Thr Cys Ser Phe Thr Tyr Pro Ile Arg Ala Gly Asn Asp Pro 
145                  150                155                  160
Gly Val Ala Pro Gly Gly Thr Gly Gly Gly Leu Leu Tyr Gly Arg Glu 
                165                  170                175    
Ser Ala Pro Pro Pro Thr Ala Pro Phe Asn Leu Ala Asp Ile Asn Asp 
            180                  185                190        
Val Ser Pro Ser Gly Gly Phe Val Ala Glu Leu Leu Arg Pro Glu Leu 
        195                  200                205            
Asp Val Tyr Ile Pro Pro Gln Gln Pro Gln Pro Pro Gly Gly Gly Leu 
    210                  215                220                
Met Gly Lys Phe Val Leu Lys Ala Ser Leu Ser Ala Pro Gly Ser Glu 
225                  230                235                  240
Tyr Gly Ser Pro Ser Val Ile Ser Val Ser Lys Gly Ser Pro Asp Gly 
                245                  250                255    
Ser His Pro Val Val Val Ala Pro Tyr Asn Gly Gly Pro Pro Arg Thr 
            260                  265                270        
Cys Pro Lys Ile Lys Gln Glu Ala Val Ser Ser Cys Thr His Leu Gly 
        275                  280                285            
Ala Gly Pro Pro Leu Ser Asn Gly His Arg Pro Ala Ala His Asp Phe 
    290                  295                300                
Pro Leu Gly Arg Gln Leu Pro Ser Arg Thr Thr Pro Thr Leu Gly Leu 
305                  310                315                  320
Glu Glu Val Leu Ser Ser Arg Asp Cys His Pro Ala Leu Pro Leu Pro 
                325                  330                335    
Pro Gly Phe His Pro His Pro Gly Pro Asn Tyr Pro Ser Phe Leu Pro 
            340                  345                350        
Asp Gln Met Gln Pro Gln Val Pro Pro Leu His Tyr Gln Glu Leu Met 
        355                  360                365            
Pro Pro Gly Ser Cys Met Pro Glu Glu Pro Lys Pro Lys Arg Gly Arg 
    370                  375                380                
Arg Ser Trp Pro Arg Lys Arg Thr Ala Thr His Thr Cys Asp Tyr Ala 
385                  390                395                  400
Gly Cys Gly Lys Thr Tyr Thr Lys Ser Ser His Leu Lys Ala His Leu 
                405                  410                415    
Arg Thr His Thr Gly Glu Lys Pro Tyr His Cys Asp Trp Asp Gly Cys 
            420                  425                430        
Gly Trp Lys Phe Ala Arg Ser Asp Glu Leu Thr Arg His Tyr Arg Lys 
        435                  440                445            
His Thr Gly His Arg Pro Phe Gln Cys Gln Lys Cys Asp Arg Ala Phe 
    450                  455                460                
Ser Arg Ser Asp His Leu Ala Leu His Met Lys Arg His Phe 
465                  470                475            

<210> 67
<211> 2520
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..2520
<223> /mol_type="DNA"
      /note="Homo sapiens Sox-2"
      /organism="Homo sapiens"

<400> 67
ggatggttgt ctattaactt gttcaaaaaa gtatcaggag ttgtcaaggc agagaagaga      60

gtgtttgcaa aagggggaaa gtagtttgct gcctctttaa gactaggact gagagaaaga     120

agaggagaga gaaagaaagg gagagaagtt tgagccccag gcttaagcct ttccaaaaaa     180

taataataac aatcatcggc ggcggcagga tcggccagag gaggagggaa gcgctttttt     240

tgatcctgat tccagtttgc ctctctcttt ttttccccca aattattctt cgcctgattt     300

tcctcgcgga gccctgcgct cccgacaccc ccgcccgcct cccctcctcc tctccccccg     360

cccgcgggcc ccccaaagtc ccggccgggc cgagggtcgg cggccgccgg cgggccgggc     420

ccgcgcacag cgcccgcatg tacaacatga tggagacgga gctgaagccg ccgggcccgc     480

agcaaacttc ggggggcggc ggcggcaact ccaccgcggc ggcggccggc ggcaaccaga     540

aaaacagccc ggaccgcgtc aagcggccca tgaatgcctt catggtgtgg tcccgcgggc     600

agcggcgcaa gatggcccag gagaacccca agatgcacaa ctcggagatc agcaagcgcc     660

tgggcgccga gtggaaactt ttgtcggaga cggagaagcg gccgttcatc gacgaggcta     720

agcggctgcg agcgctgcac atgaaggagc acccggatta taaataccgg ccccggcgga     780

aaaccaagac gctcatgaag aaggataagt acacgctgcc cggcgggctg ctggcccccg     840

gcggcaatag catggcgagc ggggtcgggg tgggcgccgg cctgggcgcg ggcgtgaacc     900

agcgcatgga cagttacgcg cacatgaacg gctggagcaa cggcagctac agcatgatgc     960

aggaccagct gggctacccg cagcacccgg gcctcaatgc gcacggcgca gcgcagatgc    1020

agcccatgca ccgctacgac gtgagcgccc tgcagtacaa ctccatgacc agctcgcaga    1080

cctacatgaa cggctcgccc acctacagca tgtcctactc gcagcagggc acccctggca    1140

tggctcttgg ctccatgggt tcggtggtca agtccgaggc cagctccagc ccccctgtgg    1200

ttacctcttc ctcccactcc agggcgccct gccaggccgg ggacctccgg gacatgatca    1260

gcatgtatct ccccggcgcc gaggtgccgg aacccgccgc ccccagcaga cttcacatgt    1320

cccagcacta ccagagcggc ccggtgcccg gcacggccat taacggcaca ctgcccctct    1380

cacacatgtg agggccggac agcgaactgg aggggggaga aattttcaaa gaaaaacgag    1440

ggaaatggga ggggtgcaaa agaggagagt aagaaacagc atggagaaaa cccggtacgc    1500

tcaaaaagaa aaaggaaaaa aaaaaatccc atcacccaca gcaaatgaca gctgcaaaag    1560

agaacaccaa tcccatccac actcacgcaa aaaccgcgat gccgacaaga aaacttttat    1620

gagagagatc ctggacttct ttttggggga ctatttttgt acagagaaaa cctggggagg    1680

gtggggaggg cgggggaatg gaccttgtat agatctggag gaaagaaagc tacgaaaaac    1740

tttttaaaag ttctagtggt acggtaggag ctttgcagga agtttgcaaa agtctttacc    1800

aataatattt agagctagtc tccaagcgac gaaaaaaatg ttttaatatt tgcaagcaac    1860

ttttgtacag tatttatcga gataaacatg gcaatcaaaa tgtccattgt ttataagctg    1920

agaatttgcc aatatttttc aaggagaggc ttcttgctga attttgattc tgcagctgaa    1980

atttaggaca gttgcaaacg tgaaaagaag aaaattattc aaatttggac attttaattg    2040

tttaaaaatt gtacaaaagg aaaaaattag aataagtact ggcgaaccat ctctgtggtc    2100

ttgtttaaaa agggcaaaag ttttagactg tactaaattt tataacttac tgttaaaagc    2160

aaaaatggcc atgcaggttg acaccgttgg taatttataa tagcttttgt tcgatcccaa    2220

ctttccattt tgttcagata aaaaaaacca tgaaattact gtgtttgaaa tattttctta    2280

tggtttgtaa tatttctgta aatttattgt gatattttaa ggttttcccc cctttatttt    2340

ccgtagttgt attttaaaag attcggctct gtattatttg aatcagtctg ccgagaatcc    2400

atgtatatat ttgaactaat atcatcctta taacaggtac attttcaact taagttttta    2460

ctccattatg cacagtttga gataaataaa tttttgaaat atggacactg aaaaaaaaaa    2520


<210> 68
<211> 317
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..317
<223> /mol_type="protein"
      /note="Homo sapiens Sox-2"
      /organism="Homo sapiens"

<400> 68
Met Tyr Asn Met Met Glu Thr Glu Leu Lys Pro Pro Gly Pro Gln Gln 
1               5                   10                   15    
Thr Ser Gly Gly Gly Gly Gly Asn Ser Thr Ala Ala Ala Ala Gly Gly 
            20                   25                  30        
Asn Gln Lys Asn Ser Pro Asp Arg Val Lys Arg Pro Met Asn Ala Phe 
        35                   40                  45            
Met Val Trp Ser Arg Gly Gln Arg Arg Lys Met Ala Gln Glu Asn Pro 
    50                   55                  60                
Lys Met His Asn Ser Glu Ile Ser Lys Arg Leu Gly Ala Glu Trp Lys 
65                   70                  75                  80
Leu Leu Ser Glu Thr Glu Lys Arg Pro Phe Ile Asp Glu Ala Lys Arg 
                85                   90                  95    
Leu Arg Ala Leu His Met Lys Glu His Pro Asp Tyr Lys Tyr Arg Pro 
            100                  105                110        
Arg Arg Lys Thr Lys Thr Leu Met Lys Lys Asp Lys Tyr Thr Leu Pro 
        115                  120                125            
Gly Gly Leu Leu Ala Pro Gly Gly Asn Ser Met Ala Ser Gly Val Gly 
    130                  135                140                
Val Gly Ala Gly Leu Gly Ala Gly Val Asn Gln Arg Met Asp Ser Tyr 
145                  150                155                  160
Ala His Met Asn Gly Trp Ser Asn Gly Ser Tyr Ser Met Met Gln Asp 
                165                  170                175    
Gln Leu Gly Tyr Pro Gln His Pro Gly Leu Asn Ala His Gly Ala Ala 
            180                  185                190        
Gln Met Gln Pro Met His Arg Tyr Asp Val Ser Ala Leu Gln Tyr Asn 
        195                  200                205            
Ser Met Thr Ser Ser Gln Thr Tyr Met Asn Gly Ser Pro Thr Tyr Ser 
    210                  215                220                
Met Ser Tyr Ser Gln Gln Gly Thr Pro Gly Met Ala Leu Gly Ser Met 
225                  230                235                  240
Gly Ser Val Val Lys Ser Glu Ala Ser Ser Ser Pro Pro Val Val Thr 
                245                  250                255    
Ser Ser Ser His Ser Arg Ala Pro Cys Gln Ala Gly Asp Leu Arg Asp 
            260                  265                270        
Met Ile Ser Met Tyr Leu Pro Gly Ala Glu Val Pro Glu Pro Ala Ala 
        275                  280                285            
Pro Ser Arg Leu His Met Ser Gln His Tyr Gln Ser Gly Pro Val Pro 
    290                  295                300                
Gly Thr Ala Ile Asn Gly Thr Leu Pro Leu Ser His Met 
305                  310                315        

<210> 69
<211> 2098
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..2098
<223> /mol_type="DNA"
      /note="Homo sapiens NANOG"
      /organism="Homo sapiens"

<400> 69
attataaatc tagagactcc aggattttaa cgttctgctg gactgagctg gttgcctcat      60

gttattatgc aggcaactca ctttatccca atttcttgat acttttcctt ctggaggtcc     120

tatttctcta acatcttcca gaaaagtctt aaagctgcct taaccttttt tccagtccac     180

ctcttaaatt ttttcctcct cttcctctat actaacatga gtgtggatcc agcttgtccc     240

caaagcttgc cttgctttga agcatccgac tgtaaagaat cttcacctat gcctgtgatt     300

tgtgggcctg aagaaaacta tccatccttg caaatgtctt ctgctgagat gcctcacacg     360

gagactgtct ctcctcttcc ttcctccatg gatctgctta ttcaggacag ccctgattct     420

tccaccagtc ccaaaggcaa acaacccact tctgcagaga agagtgtcgc aaaaaaggaa     480

gacaaggtcc cggtcaagaa acagaagacc agaactgtgt tctcttccac ccagctgtgt     540

gtactcaatg atagatttca gagacagaaa tacctcagcc tccagcagat gcaagaactc     600

tccaacatcc tgaacctcag ctacaaacag gtgaagacct ggttccagaa ccagagaatg     660

aaatctaaga ggtggcagaa aaacaactgg ccgaagaata gcaatggtgt gacgcagaag     720

gcctcagcac ctacctaccc cagcctttac tcttcctacc accagggatg cctggtgaac     780

ccgactggga accttccaat gtggagcaac cagacctgga acaattcaac ctggagcaac     840

cagacccaga acatccagtc ctggagcaac cactcctgga acactcagac ctggtgcacc     900

caatcctgga acaatcaggc ctggaacagt cccttctata actgtggaga ggaatctctg     960

cagtcctgca tgcagttcca gccaaattct cctgccagtg acttggaggc tgccttggaa    1020

gctgctgggg aaggccttaa tgtaatacag cagaccacta ggtattttag tactccacaa    1080

accatggatt tattcctaaa ctactccatg aacatgcaac ctgaagacgt gtgaagatga    1140

gtgaaactga tattactcaa tttcagtctg gacactggct gaatccttcc tctcccctcc    1200

tcccatccct cataggattt ttcttgtttg gaaaccacgt gttctggttt ccatgatgcc    1260

catccagtca atctcatgga gggtggagta tggttggagc ctaatcagcg aggtttcttt    1320

tttttttttt ttcctattgg atcttcctgg agaaaatact tttttttttt ttttttttga    1380

aacggagtct tgctctgtcg cccaggctgg agtgcagtgg cgcggtcttg gctcactgca    1440

agctccgtct cccgggttca cgccattctc ctgcctcagc ctcccgagca gctgggacta    1500

caggcgcccg ccacctcgcc cggctaatat tttgtatttt tagtagagac ggggtttcac    1560

tgtgttagcc aggatggtct cgatctcctg accttgtgat ccacccgcct cggcctccct    1620

aacagctggg atttacaggc gtgagccacc gcgccctgcc tagaaaagac attttaataa    1680

ccttggctgc cgtctctggc tatagataag tagatctaat actagtttgg atatctttag    1740

ggtttagaat ctaacctcaa gaataagaaa tacaagtaca aattggtgat gaagatgtat    1800

tcgtattgtt tgggattggg aggctttgct tattttttaa aaactattga ggtaaagggt    1860

taagctgtaa catacttaat tgatttctta ccgtttttgg ctctgttttg ctatatcccc    1920

taatttgttg gttgtgctaa tctttgtaga aagaggtctc gtatttgctg catcgtaatg    1980

acatgagtac tgctttagtt ggtttaagtt caaatgaatg aaacaactat ttttccttta    2040

gttgatttta ccctgatttc accgagtgtt tcaatgagta aatatacagc ttaaacat      2098


<210> 70
<211> 305
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..305
<223> /mol_type="protein"
      /note="Homo sapiens NANOG"
      /organism="Homo sapiens"

<400> 70
Met Ser Val Asp Pro Ala Cys Pro Gln Ser Leu Pro Cys Phe Glu Ala 
1               5                   10                   15    
Ser Asp Cys Lys Glu Ser Ser Pro Met Pro Val Ile Cys Gly Pro Glu 
            20                   25                  30        
Glu Asn Tyr Pro Ser Leu Gln Met Ser Ser Ala Glu Met Pro His Thr 
        35                   40                  45            
Glu Thr Val Ser Pro Leu Pro Ser Ser Met Asp Leu Leu Ile Gln Asp 
    50                   55                  60                
Ser Pro Asp Ser Ser Thr Ser Pro Lys Gly Lys Gln Pro Thr Ser Ala 
65                   70                  75                  80
Glu Lys Ser Val Ala Lys Lys Glu Asp Lys Val Pro Val Lys Lys Gln 
                85                   90                  95    
Lys Thr Arg Thr Val Phe Ser Ser Thr Gln Leu Cys Val Leu Asn Asp 
            100                  105                110        
Arg Phe Gln Arg Gln Lys Tyr Leu Ser Leu Gln Gln Met Gln Glu Leu 
        115                  120                125            
Ser Asn Ile Leu Asn Leu Ser Tyr Lys Gln Val Lys Thr Trp Phe Gln 
    130                  135                140                
Asn Gln Arg Met Lys Ser Lys Arg Trp Gln Lys Asn Asn Trp Pro Lys 
145                  150                155                  160
Asn Ser Asn Gly Val Thr Gln Lys Ala Ser Ala Pro Thr Tyr Pro Ser 
                165                  170                175    
Leu Tyr Ser Ser Tyr His Gln Gly Cys Leu Val Asn Pro Thr Gly Asn 
            180                  185                190        
Leu Pro Met Trp Ser Asn Gln Thr Trp Asn Asn Ser Thr Trp Ser Asn 
        195                  200                205            
Gln Thr Gln Asn Ile Gln Ser Trp Ser Asn His Ser Trp Asn Thr Gln 
    210                  215                220                
Thr Trp Cys Thr Gln Ser Trp Asn Asn Gln Ala Trp Asn Ser Pro Phe 
225                  230                235                  240
Tyr Asn Cys Gly Glu Glu Ser Leu Gln Ser Cys Met Gln Phe Gln Pro 
                245                  250                255    
Asn Ser Pro Ala Ser Asp Leu Glu Ala Ala Leu Glu Ala Ala Gly Glu 
            260                  265                270        
Gly Leu Asn Val Ile Gln Gln Thr Thr Arg Tyr Phe Ser Thr Pro Gln 
        275                  280                285            
Thr Met Asp Leu Phe Leu Asn Tyr Ser Met Asn Met Gln Pro Glu Asp 
    290                  295                300                
Val 
305

<210> 71
<211> 469
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..469
<223> /mol_type="DNA"
      /note="Homo sapiens Insulin"
      /organism="Homo sapiens"

<400> 71
agccctccag gacaggctgc atcagaagag gccatcaagc agatcactgt ccttctgcca      60

tggccctgtg gatgcgcctc ctgcccctgc tggcgctgct ggccctctgg ggacctgacc     120

cagccgcagc ctttgtgaac caacacctgt gcggctcaca cctggtggaa gctctctacc     180

tagtgtgcgg ggaacgaggc ttcttctaca cacccaagac ccgccgggag gcagaggacc     240

tgcaggtggg gcaggtggag ctgggcgggg gccctggtgc aggcagcctg cagcccttgg     300

ccctggaggg gtccctgcag aagcgtggca ttgtggaaca atgctgtacc agcatctgct     360

ccctctacca gctggagaac tactgcaact agacgcagcc cgcaggcagc cccacacccg     420

ccgcctcctg caccgagaga gatggaataa agcccttgaa ccagcaaaa                 469


<210> 72
<211> 110
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..110
<223> /mol_type="protein"
      /note="Homo sapiens Insulin"
      /organism="Homo sapiens"

<400> 72
Met Ala Leu Trp Met Arg Leu Leu Pro Leu Leu Ala Leu Leu Ala Leu 
1               5                   10                   15    
Trp Gly Pro Asp Pro Ala Ala Ala Phe Val Asn Gln His Leu Cys Gly 
            20                   25                  30        
Ser His Leu Val Glu Ala Leu Tyr Leu Val Cys Gly Glu Arg Gly Phe 
        35                   40                  45            
Phe Tyr Thr Pro Lys Thr Arg Arg Glu Ala Glu Asp Leu Gln Val Gly 
    50                   55                  60                
Gln Val Glu Leu Gly Gly Gly Pro Gly Ala Gly Ser Leu Gln Pro Leu 
65                   70                  75                  80
Ala Leu Glu Gly Ser Leu Gln Lys Arg Gly Ile Val Glu Gln Cys Cys 
                85                   90                  95    
Thr Ser Ile Cys Ser Leu Tyr Gln Leu Glu Asn Tyr Cys Asn 
            100                  105                110

<210> 73
<211> 1310
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..1310
<223> /mol_type="DNA"
      /note="Homo sapiens GAPDH"
      /organism="Homo sapiens"

<400> 73
aaattgagcc cgcagcctcc cgcttcgctc tctgctcctc ctgttcgaca gtcagccgca      60

tcttcttttg cgtcgccagc cgagccacat cgctcagaca ccatggggaa ggtgaaggtc     120

ggagtcaacg gatttggtcg tattgggcgc ctggtcacca gggctgcttt taactctggt     180

aaagtggata ttgttgccat caatgacccc ttcattgacc tcaactacat ggtttacatg     240

ttccaatatg attccaccca tggcaaattc catggcaccg tcaaggctga gaacgggaag     300

cttgtcatca atggaaatcc catcaccatc ttccaggagc gagatccctc caaaatcaag     360

tggggcgatg ctggcgctga gtacgtcgtg gagtccactg gcgtcttcac caccatggag     420

aaggctgggg ctcatttgca ggggggagcc aaaagggtca tcatctctgc cccctctgct     480

gatgccccca tgttcgtcat gggtgtgaac catgagaagt atgacaacag cctcaagatc     540

atcagcaatg cctcctgcac caccaactgc ttagcacccc tggccaaggt catccatgac     600

aactttggta tcgtggaagg actcatgacc acagtccatg ccatcactgc cacccagaag     660

actgtggatg gcccctccgg gaaactgtgg cgtgatggcc gcggggctct ccagaacatc     720

atccctgcct ctactggcgc tgccaaggct gtgggcaagg tcatccctga gctgaacggg     780

aagctcactg gcatggcctt ccgtgtcccc actgccaacg tgtcagtggt ggacctgacc     840

tgccgtctag aaaaacctgc caaatatgat gacatcaaga aggtggtgaa gcaggcgtcg     900

gagggccccc tcaagggcat cctgggctac actgagcacc aggtggtctc ctctgacttc     960

aacagcgaca cccactcctc cacctttgac gctggggctg gcattgccct caacgaccac    1020

tttgtcaagc tcatttcctg gtatgacaac gaatttggct acagcaacag ggtggtggac    1080

ctcatggccc acatggcctc caaggagtaa gacccctgga ccaccagccc cagcaagagc    1140

acaagaggaa gagagagacc ctcactgctg gggagtccct gccacactca gtcccccacc    1200

acactgaatc tcccctcctc acagttgcca tgtagacccc ttgaagaggg gaggggccta    1260

gggagccgca ccttgtcatg taccatcaat aaagtaccct gtgctcaacc               1310


<210> 74
<211> 335
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..335
<223> /mol_type="protein"
      /note="Homo sapiens GAPDH"
      /organism="Homo sapiens"

<400> 74
Met Gly Lys Val Lys Val Gly Val Asn Gly Phe Gly Arg Ile Gly Arg 
1               5                   10                   15    
Leu Val Thr Arg Ala Ala Phe Asn Ser Gly Lys Val Asp Ile Val Ala 
            20                   25                  30        
Ile Asn Asp Pro Phe Ile Asp Leu Asn Tyr Met Val Tyr Met Phe Gln 
        35                   40                  45            
Tyr Asp Ser Thr His Gly Lys Phe His Gly Thr Val Lys Ala Glu Asn 
    50                   55                  60                
Gly Lys Leu Val Ile Asn Gly Asn Pro Ile Thr Ile Phe Gln Glu Arg 
65                   70                  75                  80
Asp Pro Ser Lys Ile Lys Trp Gly Asp Ala Gly Ala Glu Tyr Val Val 
                85                   90                  95    
Glu Ser Thr Gly Val Phe Thr Thr Met Glu Lys Ala Gly Ala His Leu 
            100                  105                110        
Gln Gly Gly Ala Lys Arg Val Ile Ile Ser Ala Pro Ser Ala Asp Ala 
        115                  120                125            
Pro Met Phe Val Met Gly Val Asn His Glu Lys Tyr Asp Asn Ser Leu 
    130                  135                140                
Lys Ile Ile Ser Asn Ala Ser Cys Thr Thr Asn Cys Leu Ala Pro Leu 
145                  150                155                  160
Ala Lys Val Ile His Asp Asn Phe Gly Ile Val Glu Gly Leu Met Thr 
                165                  170                175    
Thr Val His Ala Ile Thr Ala Thr Gln Lys Thr Val Asp Gly Pro Ser 
            180                  185                190        
Gly Lys Leu Trp Arg Asp Gly Arg Gly Ala Leu Gln Asn Ile Ile Pro 
        195                  200                205            
Ala Ser Thr Gly Ala Ala Lys Ala Val Gly Lys Val Ile Pro Glu Leu 
    210                  215                220                
Asn Gly Lys Leu Thr Gly Met Ala Phe Arg Val Pro Thr Ala Asn Val 
225                  230                235                  240
Ser Val Val Asp Leu Thr Cys Arg Leu Glu Lys Pro Ala Lys Tyr Asp 
                245                  250                255    
Asp Ile Lys Lys Val Val Lys Gln Ala Ser Glu Gly Pro Leu Lys Gly 
            260                  265                270        
Ile Leu Gly Tyr Thr Glu His Gln Val Val Ser Ser Asp Phe Asn Ser 
        275                  280                285            
Asp Thr His Ser Ser Thr Phe Asp Ala Gly Ala Gly Ile Ala Leu Asn 
    290                  295                300                
Asp His Phe Val Lys Leu Ile Ser Trp Tyr Asp Asn Glu Phe Gly Tyr 
305                  310                315                  320
Ser Asn Arg Val Val Asp Leu Met Ala His Met Ala Ser Lys Glu 
                325                  330                335

<210> 75
<211> 5946
<212> DNA
<213> Rattus norvegicus

<220> 
<221> source
<222> 1..5946
<223> /mol_type="DNA"
      /note="Rattus norvegicus Nestin"
      /organism="Rattus norvegicus"

<400> 75
tgctggagtt ctccgcttcc gctgggtcac tgtcgccgct acttcttttc aacccctaaa       60

agctccacgg gccactccct tctctagtgc tccacgtccg cttgccctcg ggggccagac      120

cagcgacatg gagggttgcg tcggggaaga atcttttcag atgtgggagc tcaatcgacg      180

cctggaggcc tacctgaccc gggtcaagac gctagaagag caaaaccagc tgctcagcgc      240

cgagcttggg ggactccggg cgcagtccgg agacacctcc tggagagccc gagccgatga      300

cgagctggca tccctgcgga tcctcgtcga tcagcgctgg cgggagaagc tcgaggctga      360

ggtgcagcgc gacaaccttg cggaagagct ggagagcgtg gcgggccggt gccagcaggt      420

gcggcttgct cgggagcgga ccgtccagga ggccgcctgc agccggcgcg cactcgaggc      480

ggagaagaat gcgcggggct ggctgagcac ccaggcggcc gagctggagc gggagttaga      540

ggctctgcga gccgcgcacg aggaggagcg cgcacacctg aacgcccagg ccgcctgtgc      600

gcctcgccgg ccccccgcac cgccccaccg gatccccggt ccggcccccg aagtcgagga      660

tctggccagg cgactaggcg aagtgtggcg cggggcggtg cgtgactacc aggagcgcgt      720

ggctcacatg gaaagctcgc tgggtcaggc acgcgagcgg ctgagccaag ccgtgcgggg      780

cgctcgggag tgtcgcttag aggtgcaaca gctgcaggct gatcgcgaca gcctccagga      840

gcgcagagaa gcgctggaac agagattgga aggccgctgg caggaccggc tgcaggccac      900

tgataagttc cagctggctg tggaagccct ggagcaggag aagcaaggtc tacagagtca      960

gatcgctcag atcctggaag gtgggcagca actggcacac ctcaagatgt cccttagtct     1020

ggaggtggct acatacagga ctctgctgga ggctgagaac tctcggttgc agacacctgg     1080

acgaggttcc caggcttctc ttggctttct ggaccccaag ctgaagccga atttccttgg     1140

gataccagag gaccagtacc tgggatctgt gctccctgcc ctcagcccca catccttccc     1200

ttcccccttg cctaataccc ttgagactcc tgtgacagcc ttcctgaaga ctcaggagtt     1260

ccttcaggcc agaaccccca ccttggccag cactcccatc ccacctatat ctgaggctcc     1320

ctgtcctcca aatgcagagg tgagagccca ggaggtccct ctttctctgc tccagacaca     1380

ggctccagag cccctttggc tgaaggccac agtgcctagt tcttctgcta tcctcccaga     1440

actagaggaa cctgggggca agcagcaggg tcacttccct gatgatctga cctccttagc     1500

cacaaacctc aaccctcacc accctacttt agaggctaaa gatggagaat ccagtgagtc     1560

tagagtttct agcatattcc aggaagatga ggggcaaatc tgggaactgg tagagaaaga     1620

agcagatata gaggtaaaag tagaaaacag ctcagcccag aaaacacaag aaagtggtct     1680

ggacacagaa gaaacccagg attcccaggg acctttgcag aaggaaacac tgaaggctct     1740

aggagaggag ccactgatgt ctctgaaaat ccagaactat gagacagcag ggaaagagaa     1800

ttgcaattct tctacagaag gccacctggg aacactagaa ggcccagaaa aagaaaagca     1860

aataccacta aagtctttag aagaaaagaa tgtagagtca gagaaaactc tagaaaatgg     1920

ggttcctgta ctatctgagc ttttaggaaa agaagacaca agaacagagg atcaagaatt     1980

aatgtctcct aaaggtacac taaagagatt ttcatctcta ggaaaggaaa gtcaagaagt     2040

agtgaggcct tcaaaagagg ggaacctaga atcatggaca gcttttaaag aggagagcca     2100

acacccactg ggatttccag gagctgagga ccagatgctt gagagactgg tagagaaaga     2160

ggatcagagc ttcccaaggt ctccagagga agaggaccag gaggcatgta gacctctgca     2220

gaaagagaat caggaaccac tagggtatga agaagcagag ggccagatac ttgagagact     2280

gatagaaaaa gagagtcagg agtccctgag gtctccagaa gaagaggacc aggaggcagg     2340

tagatctctg cagaaagaga atcaggagcc actagggtat gaagaagcag aggaccagat     2400

gcttgagaga ctgatagaaa aagagagtca ggagtccctg aagtctccag aagaaaacca     2460

gaggattggg aagcctctag aaagagagaa tcagaaatct ctgaggtatc ttgaagaaaa     2520

ccaggagact tttgtaccac tagaaagcag gaaccagagg ccactgagat ctctagaagt     2580

agaagaggag gagcagagaa ttgtgaaacc tctagaaaaa gtgagtcagg attccctcgg     2640

atctctagca gaagagaatg tgcagccact gaggtatctg gaagaagatg actgcataaa     2700

taagagcctt ctagaagaca agactcacaa gtccttgggg tctcttgaag atagaaatgg     2760

ggatagcatt attataccac aagaaagtga gacccaggtt tcattgaggc ctccagaaga     2820

ggaggaccag aggattgtga accatctaga aaaagaaagt caggagttct cgaggtcttc     2880

agaagaagaa gagcaggtga tggagagatc tctagaagga gagaaccatg aatcactgag     2940

ttctgtagaa aaagaggacc agatggttga gagccaacta gagaaagaga gtcaggactc     3000

agggaagtct cttgaagatg agagccagga gacctttgga cctctggaaa aagagaatgc     3060

agagtccctg agatctctag caggacagga ccaagaggaa cagaagcttg aacaagagac     3120

ccaacaaaca ctgagggctg tagggaatga gcagatggca gtgagcccac cagaaaaggt     3180

ggatccagag ttaccgaagc ctcttggaaa tgaccaggaa atagctagat ctcttggaaa     3240

agagaatcaa gagtcactag tgtcactgaa agaaaaaggt atagagacag tgaagtcttt     3300

agaaacagag atcatagaac cactggagac tgcagaagag gacctggaaa gaaggaagtc     3360

tatagatact caggagccat tgtggtctac tgaagtggct agagagacag tagaacctcc     3420

agaagatgag cccccaggat cgctagggtc tgtggatgag aaccgagaga cactgacatc     3480

ccttgaaaag gagagtcaag aactgagctc tctgggcaag tggaacgtag agaccagggt     3540

agaggacagt cagcagtgcc tgcaagtaga agagggtctg caggaggaac agcaccaaga     3600

gtctctgaga gaggtgaagc aggagctgcc tagctctgga aatcaacagc ggtgggagga     3660

tgtggtggag ggcaaagcag tgggtcagga agcacctctg gcaaccacag gagtgggaac     3720

tgaggataag gcagagttgc atctgagggg gcaaggtgga gaggaagaag ctgcagcaga     3780

gggagagctg ttgcaggata ttgtggggga ggcctggagt ctggggagct ctgagcccaa     3840

ggagcagagg gtccctgctg aggccctcga caacctggaa ggaggggcct tagaggtccc     3900

agttgctcag tcaatgccag aggtgacaga gcgagatgag gatagagccc aagcaggtga     3960

acaagactcc atagaggtga cccttgggtt agaggctgcc agaactggac tggaactcga     4020

gcaggaagtg gtagggctag aggacccaag gcattttgcc agggaggagg ccattccccc     4080

atccctgggg gaggaaagtg tgaaggcaaa gatagctcag ggcttggaag ggcctggaaa     4140

ggaaccaaaa gaggcaggtg ctctggactc ggggatcctt gaattgccca agactagcag     4200

cgaggctctg gaatgccagg gccatgaaga gtctgagtcc atggagggct gggaagaaga     4260

ggaggcctca ctggagactt cagatcatga gggcagtgat gcccctcagc ccaggccccc     4320

agaaacagaa gaagatgagg gtgcacaggc agcactgaca gcccctggtc ccaagctctt     4380

ggaaccctgt tcacccatcc caatcctgac agatgcccat gagctgcagc cccaggctga     4440

ggggatccag gaggctggct ggcagccaga agctgggtct gaagcactag aaagggtaga     4500

aaatgagcca gagtttggtc ttggggagat cccggagggc ctccaggatt gggaagaggg     4560

cagagaagaa agcgaggcag atgatctagg ggaaactctc cctgactcta ctcccctggg     4620

cctctacctg aggtcccctg cttctccaaa gtgggatctg gctggagaac agaggctttc     4680

ccctcaaggg gatgccggga aggaagactg gggtcctgct gtccccgctg cccagggcct     4740

cagtggtcca ccggaagagg aggaggagca aggccatggc tctgacctat catctgagga     4800

gtttgaggac ctagggactg aggcctctct tcttccaggg gttcccaagg aggtggcaga     4860

tcacgtgggc caagtgcccc cggtactgca gcctgcatgc tgggatcagg gtggggaatc     4920

tgatgggttt gctgatgagg aagaaagtgg ggaggaggga gaggaagaag atgctgatga     4980

ggaaggagca gagtcaggag ctcagtggtg ggggtcaggg gcctctggtg gaggctgcaa     5040

ggtccaggat attgcccaaa gaggagaccc ggtacaggag tctgtgggtg tcagtggtct     5100

ctgggatgat ggcttgagag gtgctgcagc taatgttcct gccctagaga tggtatctca     5160

ggacagtgct gagccttctg ggtcagagga gtctgagtct gcttccttgg agggggagga     5220

aggtcaagtg actgaccatt tagatgctcc ccaggaggtg accagcatgg tcccgggggt     5280

aggagatgcc tttgacattg gtggccagag ccccaacttg gactcagaac aagtgaatgg     5340

gaaaatggag aatggactag aacaggctga ggggcaggtg gtcctggatg gggacgagga     5400

tcaagaactc ctattacagg gacaggaggt gggtgctcta aaggttcctt tggtagcatc     5460

tcctgtgcat ctaggcccaa gccagcccct gaagttcact ctgagtgggg tagatgggga     5520

ttcctggtcc tcaggggaag actagaaact gcccctctgg ctctgaggat gtactggtgg     5580

ggatgtccct ccctgctctg ggtgaccact cttagctttg ataacttgac ccatggtatt     5640

tgtcctggag agttgtggct gggctgagca agggaggtga gatcctcctg aaggctcagg     5700

agttccaggc ctatagttct accccctctt tcttctgtgg ctcacctgct ggaagaggcc     5760

tgggcccaga gctttcccac aaggctgttc tggccacagc ttgctagcct tgcctaccac     5820

ctgcacaagg tctggtctgg tgtatgacca ggggagctga gggcagcatt tatctgaccc     5880

ttcatctcag cctgctgaga gcttgttcct ctcttcctcc ctgaataaag ccgtatccct     5940

acctac                                                                5946


<210> 76
<211> 1805
<212> PRT
<213> Rattus norvegicus

<220> 
<221> SOURCE
<222> 1..1805
<223> /mol_type="protein"
      /note="Rattus norvegicus Nestin"
      /organism="Rattus norvegicus"

<400> 76
Met Glu Gly Cys Val Gly Glu Glu Ser Phe Gln Met Trp Glu Leu Asn 
1               5                   10                   15    
Arg Arg Leu Glu Ala Tyr Leu Thr Arg Val Lys Thr Leu Glu Glu Gln 
            20                   25                  30        
Asn Gln Leu Leu Ser Ala Glu Leu Gly Gly Leu Arg Ala Gln Ser Gly 
        35                   40                  45            
Asp Thr Ser Trp Arg Ala Arg Ala Asp Asp Glu Leu Ala Ser Leu Arg 
    50                   55                  60                
Ile Leu Val Asp Gln Arg Trp Arg Glu Lys Leu Glu Ala Glu Val Gln 
65                   70                  75                  80
Arg Asp Asn Leu Ala Glu Glu Leu Glu Ser Val Ala Gly Arg Cys Gln 
                85                   90                  95    
Gln Val Arg Leu Ala Arg Glu Arg Thr Val Gln Glu Ala Ala Cys Ser 
            100                  105                110        
Arg Arg Ala Leu Glu Ala Glu Lys Asn Ala Arg Gly Trp Leu Ser Thr 
        115                  120                125            
Gln Ala Ala Glu Leu Glu Arg Glu Leu Glu Ala Leu Arg Ala Ala His 
    130                  135                140                
Glu Glu Glu Arg Ala His Leu Asn Ala Gln Ala Ala Cys Ala Pro Arg 
145                  150                155                  160
Arg Pro Pro Ala Pro Pro His Arg Ile Pro Gly Pro Ala Pro Glu Val 
                165                  170                175    
Glu Asp Leu Ala Arg Arg Leu Gly Glu Val Trp Arg Gly Ala Val Arg 
            180                  185                190        
Asp Tyr Gln Glu Arg Val Ala His Met Glu Ser Ser Leu Gly Gln Ala 
        195                  200                205            
Arg Glu Arg Leu Ser Gln Ala Val Arg Gly Ala Arg Glu Cys Arg Leu 
    210                  215                220                
Glu Val Gln Gln Leu Gln Ala Asp Arg Asp Ser Leu Gln Glu Arg Arg 
225                  230                235                  240
Glu Ala Leu Glu Gln Arg Leu Glu Gly Arg Trp Gln Asp Arg Leu Gln 
                245                  250                255    
Ala Thr Asp Lys Phe Gln Leu Ala Val Glu Ala Leu Glu Gln Glu Lys 
            260                  265                270        
Gln Gly Leu Gln Ser Gln Ile Ala Gln Ile Leu Glu Gly Gly Gln Gln 
        275                  280                285            
Leu Ala His Leu Lys Met Ser Leu Ser Leu Glu Val Ala Thr Tyr Arg 
    290                  295                300                
Thr Leu Leu Glu Ala Glu Asn Ser Arg Leu Gln Thr Pro Gly Arg Gly 
305                  310                315                  320
Ser Gln Ala Ser Leu Gly Phe Leu Asp Pro Lys Leu Lys Pro Asn Phe 
                325                  330                335    
Leu Gly Ile Pro Glu Asp Gln Tyr Leu Gly Ser Val Leu Pro Ala Leu 
            340                  345                350        
Ser Pro Thr Ser Phe Pro Ser Pro Leu Pro Asn Thr Leu Glu Thr Pro 
        355                  360                365            
Val Thr Ala Phe Leu Lys Thr Gln Glu Phe Leu Gln Ala Arg Thr Pro 
    370                  375                380                
Thr Leu Ala Ser Thr Pro Ile Pro Pro Ile Ser Glu Ala Pro Cys Pro 
385                  390                395                  400
Pro Asn Ala Glu Val Arg Ala Gln Glu Val Pro Leu Ser Leu Leu Gln 
                405                  410                415    
Thr Gln Ala Pro Glu Pro Leu Trp Leu Lys Ala Thr Val Pro Ser Ser 
            420                  425                430        
Ser Ala Ile Leu Pro Glu Leu Glu Glu Pro Gly Gly Lys Gln Gln Gly 
        435                  440                445            
His Phe Pro Asp Asp Leu Thr Ser Leu Ala Thr Asn Leu Asn Pro His 
    450                  455                460                
His Pro Thr Leu Glu Ala Lys Asp Gly Glu Ser Ser Glu Ser Arg Val 
465                  470                475                  480
Ser Ser Ile Phe Gln Glu Asp Glu Gly Gln Ile Trp Glu Leu Val Glu 
                485                  490                495    
Lys Glu Ala Asp Ile Glu Val Lys Val Glu Asn Ser Ser Ala Gln Lys 
            500                  505                510        
Thr Gln Glu Ser Gly Leu Asp Thr Glu Glu Thr Gln Asp Ser Gln Gly 
        515                  520                525            
Pro Leu Gln Lys Glu Thr Leu Lys Ala Leu Gly Glu Glu Pro Leu Met 
    530                  535                540                
Ser Leu Lys Ile Gln Asn Tyr Glu Thr Ala Gly Lys Glu Asn Cys Asn 
545                  550                555                  560
Ser Ser Thr Glu Gly His Leu Gly Thr Leu Glu Gly Pro Glu Lys Glu 
                565                  570                575    
Lys Gln Ile Pro Leu Lys Ser Leu Glu Glu Lys Asn Val Glu Ser Glu 
            580                  585                590        
Lys Thr Leu Glu Asn Gly Val Pro Val Leu Ser Glu Leu Leu Gly Lys 
        595                  600                605            
Glu Asp Thr Arg Thr Glu Asp Gln Glu Leu Met Ser Pro Lys Gly Thr 
    610                  615                620                
Leu Lys Arg Phe Ser Ser Leu Gly Lys Glu Ser Gln Glu Val Val Arg 
625                  630                635                  640
Pro Ser Lys Glu Gly Asn Leu Glu Ser Trp Thr Ala Phe Lys Glu Glu 
                645                  650                655    
Ser Gln His Pro Leu Gly Phe Pro Gly Ala Glu Asp Gln Met Leu Glu 
            660                  665                670        
Arg Leu Val Glu Lys Glu Asp Gln Ser Phe Pro Arg Ser Pro Glu Glu 
        675                  680                685            
Glu Asp Gln Glu Ala Cys Arg Pro Leu Gln Lys Glu Asn Gln Glu Pro 
    690                  695                700                
Leu Gly Tyr Glu Glu Ala Glu Gly Gln Ile Leu Glu Arg Leu Ile Glu 
705                  710                715                  720
Lys Glu Ser Gln Glu Ser Leu Arg Ser Pro Glu Glu Glu Asp Gln Glu 
                725                  730                735    
Ala Gly Arg Ser Leu Gln Lys Glu Asn Gln Glu Pro Leu Gly Tyr Glu 
            740                  745                750        
Glu Ala Glu Asp Gln Met Leu Glu Arg Leu Ile Glu Lys Glu Ser Gln 
        755                  760                765            
Glu Ser Leu Lys Ser Pro Glu Glu Asn Gln Arg Ile Gly Lys Pro Leu 
    770                  775                780                
Glu Arg Glu Asn Gln Lys Ser Leu Arg Tyr Leu Glu Glu Asn Gln Glu 
785                  790                795                  800
Thr Phe Val Pro Leu Glu Ser Arg Asn Gln Arg Pro Leu Arg Ser Leu 
                805                  810                815    
Glu Val Glu Glu Glu Glu Gln Arg Ile Val Lys Pro Leu Glu Lys Val 
            820                  825                830        
Ser Gln Asp Ser Leu Gly Ser Leu Ala Glu Glu Asn Val Gln Pro Leu 
        835                  840                845            
Arg Tyr Leu Glu Glu Asp Asp Cys Ile Asn Lys Ser Leu Leu Glu Asp 
    850                  855                860                
Lys Thr His Lys Ser Leu Gly Ser Leu Glu Asp Arg Asn Gly Asp Ser 
865                  870                875                  880
Ile Ile Ile Pro Gln Glu Ser Glu Thr Gln Val Ser Leu Arg Pro Pro 
                885                  890                895    
Glu Glu Glu Asp Gln Arg Ile Val Asn His Leu Glu Lys Glu Ser Gln 
            900                  905                910        
Glu Phe Ser Arg Ser Ser Glu Glu Glu Glu Gln Val Met Glu Arg Ser 
        915                  920                925            
Leu Glu Gly Glu Asn His Glu Ser Leu Ser Ser Val Glu Lys Glu Asp 
    930                  935                940                
Gln Met Val Glu Ser Gln Leu Glu Lys Glu Ser Gln Asp Ser Gly Lys 
945                  950                955                  960
Ser Leu Glu Asp Glu Ser Gln Glu Thr Phe Gly Pro Leu Glu Lys Glu 
                965                  970                975    
Asn Ala Glu Ser Leu Arg Ser Leu Ala Gly Gln Asp Gln Glu Glu Gln 
            980                  985                990        
Lys Leu Glu Gln Glu Thr Gln Gln Thr Leu Arg Ala Val Gly Asn Glu 
        995                  1000                1005            
Gln Met Ala Val Ser Pro Pro Glu Lys Val Asp Pro Glu Leu Pro Lys 
    1010                1015                1020                
Pro Leu Gly Asn Asp Gln Glu Ile Ala Arg Ser Leu Gly Lys Glu Asn 
1025                1030                1035                1040
Gln Glu Ser Leu Val Ser Leu Lys Glu Lys Gly Ile Glu Thr Val Lys 
                1045                1050                1055    
Ser Leu Glu Thr Glu Ile Ile Glu Pro Leu Glu Thr Ala Glu Glu Asp 
            1060                1065                1070        
Leu Glu Arg Arg Lys Ser Ile Asp Thr Gln Glu Pro Leu Trp Ser Thr 
        1075                1080                1085            
Glu Val Ala Arg Glu Thr Val Glu Pro Pro Glu Asp Glu Pro Pro Gly 
    1090                1095                1100                
Ser Leu Gly Ser Val Asp Glu Asn Arg Glu Thr Leu Thr Ser Leu Glu 
1105                1110                1115                1120
Lys Glu Ser Gln Glu Leu Ser Ser Leu Gly Lys Trp Asn Val Glu Thr 
                1125                1130                1135    
Arg Val Glu Asp Ser Gln Gln Cys Leu Gln Val Glu Glu Gly Leu Gln 
            1140                1145                1150        
Glu Glu Gln His Gln Glu Ser Leu Arg Glu Val Lys Gln Glu Leu Pro 
        1155                1160                1165            
Ser Ser Gly Asn Gln Gln Arg Trp Glu Asp Val Val Glu Gly Lys Ala 
    1170                1175                1180                
Val Gly Gln Glu Ala Pro Leu Ala Thr Thr Gly Val Gly Thr Glu Asp 
1185                1190                1195                1200
Lys Ala Glu Leu His Leu Arg Gly Gln Gly Gly Glu Glu Glu Ala Ala 
                1205                1210                1215    
Ala Glu Gly Glu Leu Leu Gln Asp Ile Val Gly Glu Ala Trp Ser Leu 
            1220                1225                1230        
Gly Ser Ser Glu Pro Lys Glu Gln Arg Val Pro Ala Glu Ala Leu Asp 
        1235                1240                1245            
Asn Leu Glu Gly Gly Ala Leu Glu Val Pro Val Ala Gln Ser Met Pro 
    1250                1255                1260                
Glu Val Thr Glu Arg Asp Glu Asp Arg Ala Gln Ala Gly Glu Gln Asp 
1265                1270                1275                1280
Ser Ile Glu Val Thr Leu Gly Leu Glu Ala Ala Arg Thr Gly Leu Glu 
                1285                1290                1295    
Leu Glu Gln Glu Val Val Gly Leu Glu Asp Pro Arg His Phe Ala Arg 
            1300                1305                1310        
Glu Glu Ala Ile Pro Pro Ser Leu Gly Glu Glu Ser Val Lys Ala Lys 
        1315                1320                1325            
Ile Ala Gln Gly Leu Glu Gly Pro Gly Lys Glu Pro Lys Glu Ala Gly 
    1330                1335                1340                
Ala Leu Asp Ser Gly Ile Leu Glu Leu Pro Lys Thr Ser Ser Glu Ala 
1345                1350                1355                1360
Leu Glu Cys Gln Gly His Glu Glu Ser Glu Ser Met Glu Gly Trp Glu 
                1365                1370                1375    
Glu Glu Glu Ala Ser Leu Glu Thr Ser Asp His Glu Gly Ser Asp Ala 
            1380                1385                1390        
Pro Gln Pro Arg Pro Pro Glu Thr Glu Glu Asp Glu Gly Ala Gln Ala 
        1395                1400                1405            
Ala Leu Thr Ala Pro Gly Pro Lys Leu Leu Glu Pro Cys Ser Pro Ile 
    1410                1415                1420                
Pro Ile Leu Thr Asp Ala His Glu Leu Gln Pro Gln Ala Glu Gly Ile 
1425                1430                1435                1440
Gln Glu Ala Gly Trp Gln Pro Glu Ala Gly Ser Glu Ala Leu Glu Arg 
                1445                1450                1455    
Val Glu Asn Glu Pro Glu Phe Gly Leu Gly Glu Ile Pro Glu Gly Leu 
            1460                1465                1470        
Gln Asp Trp Glu Glu Gly Arg Glu Glu Ser Glu Ala Asp Asp Leu Gly 
        1475                1480                1485            
Glu Thr Leu Pro Asp Ser Thr Pro Leu Gly Leu Tyr Leu Arg Ser Pro 
    1490                1495                1500                
Ala Ser Pro Lys Trp Asp Leu Ala Gly Glu Gln Arg Leu Ser Pro Gln 
1505                1510                1515                1520
Gly Asp Ala Gly Lys Glu Asp Trp Gly Pro Ala Val Pro Ala Ala Gln 
                1525                1530                1535    
Gly Leu Ser Gly Pro Pro Glu Glu Glu Glu Glu Gln Gly His Gly Ser 
            1540                1545                1550        
Asp Leu Ser Ser Glu Glu Phe Glu Asp Leu Gly Thr Glu Ala Ser Leu 
        1555                1560                1565            
Leu Pro Gly Val Pro Lys Glu Val Ala Asp His Val Gly Gln Val Pro 
    1570                1575                1580                
Pro Val Leu Gln Pro Ala Cys Trp Asp Gln Gly Gly Glu Ser Asp Gly 
1585                1590                1595                1600
Phe Ala Asp Glu Glu Glu Ser Gly Glu Glu Gly Glu Glu Glu Asp Ala 
                1605                1610                1615    
Asp Glu Glu Gly Ala Glu Ser Gly Ala Gln Trp Trp Gly Ser Gly Ala 
            1620                1625                1630        
Ser Gly Gly Gly Cys Lys Val Gln Asp Ile Ala Gln Arg Gly Asp Pro 
        1635                1640                1645            
Val Gln Glu Ser Val Gly Val Ser Gly Leu Trp Asp Asp Gly Leu Arg 
    1650                1655                1660                
Gly Ala Ala Ala Asn Val Pro Ala Leu Glu Met Val Ser Gln Asp Ser 
1665                1670                1675                1680
Ala Glu Pro Ser Gly Ser Glu Glu Ser Glu Ser Ala Ser Leu Glu Gly 
                1685                1690                1695    
Glu Glu Gly Gln Val Thr Asp His Leu Asp Ala Pro Gln Glu Val Thr 
            1700                1705                1710        
Ser Met Val Pro Gly Val Gly Asp Ala Phe Asp Ile Gly Gly Gln Ser 
        1715                1720                1725            
Pro Asn Leu Asp Ser Glu Gln Val Asn Gly Lys Met Glu Asn Gly Leu 
    1730                1735                1740                
Glu Gln Ala Glu Gly Gln Val Val Leu Asp Gly Asp Glu Asp Gln Glu 
1745                1750                1755                1760
Leu Leu Leu Gln Gly Gln Glu Val Gly Ala Leu Lys Val Pro Leu Val 
                1765                1770                1775    
Ala Ser Pro Val His Leu Gly Pro Ser Gln Pro Leu Lys Phe Thr Leu 
            1780                1785                1790        
Ser Gly Val Asp Gly Asp Ser Trp Ser Ser Gly Glu Asp 
        1795                1800                1805

<210> 77
<211> 5843
<212> DNA
<213> Rattus norvegicus

<220> 
<221> source
<222> 1..5843
<223> /mol_type="DNA"
      /note="Rattus norvegicus Col1A1"
      /organism="Rattus norvegicus"

<400> 77
cgggagtttc acctccggac ggagcaggag gcacacggag tgaggccacg catgagccga       60

agctaacccc ccaccccagc cgcaaagagt ctacatgtct agggtctaga catgttcagc      120

tttgtggacc tccggctcct gctcctctta ggggccactg ccctcctgac gcatggccaa      180

gaagacatcc ctgaagtcag ctgcatacac aatggcctaa gggtccctaa tggtgagacg      240

tggaaacctg atgtatgctt gatctgtatc tgccacaatg gcacggctgt gtgcgatggc      300

gtgctatgca aagaagactt ggactgtccc aacccccaaa aacgggaggg cgagtgctgt      360

cctttctgcc cagaagaata tgtatcacca gacgcagaag tcataggagt cgagggaccc      420

aagggagacc ctggccccca aggcccacgg ggacctgttg gcccccctgg acaagatggc      480

atccctggac agcctggact tcctggtcct cctggtcccc ccggcccccc cggaccccct      540

ggtcttggag gaaactttgc ttcccagatg tcctatggct atgatgagaa atcagctgga      600

gtttccgtgc ctggccccat gggtccttct ggtcctcgtg gtctccctgg cccccctggt      660

gcacctggtc ctcaaggttt ccaaggcccc cctggtgaac ctggcgagcc tggcgcttca      720

ggtccaatgg gtccccgagg tccccctggc cctcctggca agaacggaga tgatggggaa      780

gctggtaagc ctggccgccc tggtgagcgt ggacctcctg gacctcaggg tgctcgtgga      840

ttgcctggaa cagctggcct ccccggaatg aagggacaca gaggtttcag tggtttggat      900

ggtgccaaag gagatactgg tcctgctggt cctaagggag agcctggcag tcctggtgaa      960

aatggagctc ccggccagat gggtccccga ggtctgcctg gtgagagagg tcgccctgga     1020

ccccctggca gtgctggtgc tcgtggtaac gatggtgctg tcggtgcagc tgggcccccc     1080

ggtcccaccg gccctactgg ccctcctggc ttccctggtg cagctggtgc taagggtgaa     1140

gctggtcccc agggagcccg aggctctgaa ggtccccagg gtgtgcgtgg tgagcccgga     1200

ccccctggcc ctgctggtgc tgctggtcct gctggaaacc ctggtgctga tggacaacct     1260

ggtgctaaag gtgccaatgg tgctcctggt attgctggtg ctcctggctt ccctggtgcc     1320

cgaggcccct ctggacctca gggccccagc ggcgctcctg gtcccaaagg caacagtggt     1380

gaacctggtg cccctggcaa caaaggagac actggtgcca aaggagaacc cggccctgct     1440

ggagttcaag gtccccctgg ccctgctgga gaagaaggaa aacgaggagc ccgtggtgag     1500

cctggaccta gcggcctgcc cggacctcct ggcgagcgcg gtggacctgg tagccgtggt     1560

ttccctggtg ctgatggtgt tgctggcccc aagggtcctg ctggtgaacg tggttctcct     1620

ggccctgctg gtcccaaagg ttctcctggt gaagctggtc gccctggtga agctggtctc     1680

cctggtgcca agggtctcac tggcagtcct ggcagccctg gtcctgatgg caaaaccggc     1740

ccccctggtc ccgctggtca agatggtcgc cctggacccg caggtcctcc tggagcccgt     1800

ggacaggctg gtgtgatggg attccctgga cctaagggta ctgctggaga acctggaaag     1860

gctggagaac gaggtgtccc cggaccccct ggcgctgttg gtcccgctgg caaagatggc     1920

gaagctggag ctcaaggagc ccccggccct gctggtcctg ctggtgagag aggtgaacaa     1980

ggtcccgctg gctcccctgg attccagggt cttcctggtc ccgctggtcc tcctggtgaa     2040

gcaggcaagc ctggtgaaca gggtgttcct ggagaccttg gtgcccctgg accctctggc     2100

gcaagaggcg agagaggttt ccctggtgaa cgtggtgtac aaggtccccc aggtcctgct     2160

ggtccccgag gaaacaatgg tgcccccggc aacgatggtg ccaagggtga tactggtgcc     2220

cccggagctc ctggtagcca gggtgccccc ggtcttcagg gaatgcctgg tgaacgtggt     2280

gcagctggtc ttccaggtcc taagggtgac agaggtgatg ctggtcccaa aggtgctgat     2340

ggttctcctg gcaaagatgg cgtccgtggt ctgactggtc ccattggtcc tcctggccct     2400

gctggtgccc ctggtgacaa gggtgaaact ggtcccagtg gtcctgctgg ccccaccgga     2460

gcccgtggtg cccccggaga ccgtggtgag cctggtcccc ctggtcctgc tggcttcgct     2520

ggcccccctg gtgctgatgg ccaacctggt gcgaaaggtg aacctggtga tactggtgtg     2580

aaaggtgacg ctggtcctcc tggccctgct ggtcccgctg gaccccctgg ccccattggt     2640

aacgttggtg ctcctggacc caaaggttct cgtggtgctg ctggtccccc tggtgctact     2700

ggtttccctg gtgctgctgg tcgtgttggt ccccctggtc cctctggaaa tgctggaccc     2760

cctggccctc ccggtcccgt tggcaaagaa gggggcaaag gtccccgtgg tgagactggt     2820

cccgctggac gtcctggtga agttggtccc ccaggtcccc ctggccctgc tggtgagaaa     2880

ggatctcctg gtgctgatgg acctgctggc tctcctggta cccctggacc tcagggtatt     2940

gctggacagc gtggtgtggt cggtcttccc ggtcagagag gagaaagagg cttccctggt     3000

cttcctggac cctctggtga acccggcaaa caaggtcctt ctggagcaag tggtgaacgt     3060

ggtccccctg gccctatggg cccccctgga ttggctggcc cccctggtga atctggtcgt     3120

gagggatccc ctggtgctga aggctcccct ggaagagatg gtgctcctgg tgccaagggt     3180

gaccgtggtg agactggccc tgctggcccc cctggtgctc ctggtgctcc tggtgctccc     3240

ggccctgttg gtcctgctgg caagaatggc gaccgtggtg agactggtcc tgctggtcct     3300

gctggtccca ttggccctgc tggtgcccgt ggtcctgctg gaccccaagg cccccgtggt     3360

gacaagggtg agacaggcga acaaggtgac agaggcataa agggtcatcg tggcttctct     3420

ggtctccagg gtcctcctgg ctctcctggc tctcctggtg aacaaggccc ctctggagct     3480

tctggtcctg caggtccccg gggtccccct ggctctgctg gttctcctgg caaagatgga     3540

ctcaacggtc tccctggccc cattggtccc cctggtcctc gaggtcgcac tggcgatagt     3600

ggtcctgctg gtccccccgg acctcctgga ccccctggcc ctcccggtcc tcccagcggt     3660

ggttatgact tcagcttcct gcctcagcca cctcaagaga agtctcaaga tggtggccgt     3720

tactaccggg ccgatgatgc caacgtggtc cgtgaccgtg accttgaggt ggacactacc     3780

ctcaagagcc tgagccagca gattgagaac atccgcagcc ctgagggcag ccgcaagaac     3840

cccgcccgca catgccgtga cctcaagatg tgccactctg actggaagag cggagagtac     3900

tggatcgacc ctaaccaagg ctgcaacctg gatgccatca aggtctactg caacatggag     3960

acaggtcaga cctgtgtgtt ccccactcag ccctctgtgc ctcagaagaa ctggtacatc     4020

agcccaaacc ccaaggagaa gaagcatgtc tggtttggag agagcatgac cgatggattc     4080

cagttcgagt atggaagcga aggttccgat cctgccgatg tcgctatcca gctgaccttc     4140

ctgcgcctga tgtccaccga ggcctcccag aacatcacct atcactgcaa gaacagcgta     4200

gcctacatgg accaacagac tggcaacctc aagaagtccc tgctcctcca gggctccaac     4260

gagatcgagc tcaggggcga aggcaacagt cgattcacct acagcacgct tgtggatggc     4320

tgcacgagtc acaccggaac ttggggcaag acagtcatcg aatacaaaac caccaagacc     4380

tcccgcctgc ccatcatcga tgtggctccc ttggacattg gtgccccaga ccaggaattc     4440

ggaatggaca ttggccctgc ctgcttcgtg taaactccct ccatcccaat ctggttccct     4500

cccacccagc ccactttccc ccaaccctgg aaacagacca acaacccaaa ctcaatttcc     4560

ccaaaagcca aaaattggga gacaatttca catggacttt ggaaaacatt tttttccttt     4620

gcattcatct ctcaaactta gtttttatct ttgaccaact gaacgtgacc aaaaaccaaa     4680

agtgcattca accttaccaa aaagaaaaaa aaataagaat aaataaataa ctttttaaaa     4740

aaggaagctt ggtcctcttg cttgaagacc tatgtgggta taagtccctt tctgcccact     4800

gggcttatga taccccaaat gctgcctttt ctgttccttt ctccaccccc tcttggggcc     4860

tctcctccat tgctccccaa atttaagtct cccccaaaga cacaggaaat aatgcattgt     4920

ctgcccagcc agcaaaggca atgctgaatc gtcccaccag cccctcaacc cccagcctac     4980

ttccctaccc agcaccttca aatcctgccg ggacatgggg ttctcggact attgaaggag     5040

cctaaccatc tggcatctcc atggcctctg caacaaatcc ccacacacac tttgtttttg     5100

agggcctgtg ctgggggagc cacctgcccc tcgcaggggt ttggagccag gcagggtcac     5160

agcagactgg aaacatcggc cacacatgtg caggctgggt gggagagact gttctgttcc     5220

ttgtgtaatt gtgttgctga aagactacct cgttcttgtc tttgtgtgtc accggggcaa     5280

ctgtgtgggg gcggggatgg gggcagggtg gcagcgcgcc cagtttggta tcaaaggtgc     5340

tacatctctg tgaaggggtg gggtgggaag gaatttctgg tgctatagaa tctgagatgc     5400

tcccctagac cagcaaatgt tccttttgtt caaagtattt ttttattctt ttttttttaa     5460

tggataggga cttgtgtgaa ttttcttttc ctgacggtgc tatttaacaa gggaggagag     5520

agtgccaact ccagcctgct ctctctctac ccccctcttc actcttccag ctcctgggcc     5580

tatctgatga tctctctctc ttctgaaacc ctcccctctt gctgctgctc cctaccctca     5640

gcttctctct ctctctgtcc tgcatcaggg tttcagagca ccattttcca aagcacaaag     5700

cagtttttat ccctggggtg ggaggaagca agagactctg tacctatttt gtatgtgtat     5760

aataatttga gatgttttta attattttga ttgctggaat aaagcatgtg gaaatgaccc     5820

aacgcaaaaa aaaaaaaaaa aaa                                             5843


<210> 78
<211> 1453
<212> PRT
<213> Rattus norvegicus

<220> 
<221> SOURCE
<222> 1..1453
<223> /mol_type="protein"
      /note="Rattus norvegicus Col1A1"
      /organism="Rattus norvegicus"

<400> 78
Met Phe Ser Phe Val Asp Leu Arg Leu Leu Leu Leu Leu Gly Ala Thr 
1               5                   10                   15    
Ala Leu Leu Thr His Gly Gln Glu Asp Ile Pro Glu Val Ser Cys Ile 
            20                   25                  30        
His Asn Gly Leu Arg Val Pro Asn Gly Glu Thr Trp Lys Pro Asp Val 
        35                   40                  45            
Cys Leu Ile Cys Ile Cys His Asn Gly Thr Ala Val Cys Asp Gly Val 
    50                   55                  60                
Leu Cys Lys Glu Asp Leu Asp Cys Pro Asn Pro Gln Lys Arg Glu Gly 
65                   70                  75                  80
Glu Cys Cys Pro Phe Cys Pro Glu Glu Tyr Val Ser Pro Asp Ala Glu 
                85                   90                  95    
Val Ile Gly Val Glu Gly Pro Lys Gly Asp Pro Gly Pro Gln Gly Pro 
            100                  105                110        
Arg Gly Pro Val Gly Pro Pro Gly Gln Asp Gly Ile Pro Gly Gln Pro 
        115                  120                125            
Gly Leu Pro Gly Pro Pro Gly Pro Pro Gly Pro Pro Gly Pro Pro Gly 
    130                  135                140                
Leu Gly Gly Asn Phe Ala Ser Gln Met Ser Tyr Gly Tyr Asp Glu Lys 
145                  150                155                  160
Ser Ala Gly Val Ser Val Pro Gly Pro Met Gly Pro Ser Gly Pro Arg 
                165                  170                175    
Gly Leu Pro Gly Pro Pro Gly Ala Pro Gly Pro Gln Gly Phe Gln Gly 
            180                  185                190        
Pro Pro Gly Glu Pro Gly Glu Pro Gly Ala Ser Gly Pro Met Gly Pro 
        195                  200                205            
Arg Gly Pro Pro Gly Pro Pro Gly Lys Asn Gly Asp Asp Gly Glu Ala 
    210                  215                220                
Gly Lys Pro Gly Arg Pro Gly Glu Arg Gly Pro Pro Gly Pro Gln Gly 
225                  230                235                  240
Ala Arg Gly Leu Pro Gly Thr Ala Gly Leu Pro Gly Met Lys Gly His 
                245                  250                255    
Arg Gly Phe Ser Gly Leu Asp Gly Ala Lys Gly Asp Thr Gly Pro Ala 
            260                  265                270        
Gly Pro Lys Gly Glu Pro Gly Ser Pro Gly Glu Asn Gly Ala Pro Gly 
        275                  280                285            
Gln Met Gly Pro Arg Gly Leu Pro Gly Glu Arg Gly Arg Pro Gly Pro 
    290                  295                300                
Pro Gly Ser Ala Gly Ala Arg Gly Asn Asp Gly Ala Val Gly Ala Ala 
305                  310                315                  320
Gly Pro Pro Gly Pro Thr Gly Pro Thr Gly Pro Pro Gly Phe Pro Gly 
                325                  330                335    
Ala Ala Gly Ala Lys Gly Glu Ala Gly Pro Gln Gly Ala Arg Gly Ser 
            340                  345                350        
Glu Gly Pro Gln Gly Val Arg Gly Glu Pro Gly Pro Pro Gly Pro Ala 
        355                  360                365            
Gly Ala Ala Gly Pro Ala Gly Asn Pro Gly Ala Asp Gly Gln Pro Gly 
    370                  375                380                
Ala Lys Gly Ala Asn Gly Ala Pro Gly Ile Ala Gly Ala Pro Gly Phe 
385                  390                395                  400
Pro Gly Ala Arg Gly Pro Ser Gly Pro Gln Gly Pro Ser Gly Ala Pro 
                405                  410                415    
Gly Pro Lys Gly Asn Ser Gly Glu Pro Gly Ala Pro Gly Asn Lys Gly 
            420                  425                430        
Asp Thr Gly Ala Lys Gly Glu Pro Gly Pro Ala Gly Val Gln Gly Pro 
        435                  440                445            
Pro Gly Pro Ala Gly Glu Glu Gly Lys Arg Gly Ala Arg Gly Glu Pro 
    450                  455                460                
Gly Pro Ser Gly Leu Pro Gly Pro Pro Gly Glu Arg Gly Gly Pro Gly 
465                  470                475                  480
Ser Arg Gly Phe Pro Gly Ala Asp Gly Val Ala Gly Pro Lys Gly Pro 
                485                  490                495    
Ala Gly Glu Arg Gly Ser Pro Gly Pro Ala Gly Pro Lys Gly Ser Pro 
            500                  505                510        
Gly Glu Ala Gly Arg Pro Gly Glu Ala Gly Leu Pro Gly Ala Lys Gly 
        515                  520                525            
Leu Thr Gly Ser Pro Gly Ser Pro Gly Pro Asp Gly Lys Thr Gly Pro 
    530                  535                540                
Pro Gly Pro Ala Gly Gln Asp Gly Arg Pro Gly Pro Ala Gly Pro Pro 
545                  550                555                  560
Gly Ala Arg Gly Gln Ala Gly Val Met Gly Phe Pro Gly Pro Lys Gly 
                565                  570                575    
Thr Ala Gly Glu Pro Gly Lys Ala Gly Glu Arg Gly Val Pro Gly Pro 
            580                  585                590        
Pro Gly Ala Val Gly Pro Ala Gly Lys Asp Gly Glu Ala Gly Ala Gln 
        595                  600                605            
Gly Ala Pro Gly Pro Ala Gly Pro Ala Gly Glu Arg Gly Glu Gln Gly 
    610                  615                620                
Pro Ala Gly Ser Pro Gly Phe Gln Gly Leu Pro Gly Pro Ala Gly Pro 
625                  630                635                  640
Pro Gly Glu Ala Gly Lys Pro Gly Glu Gln Gly Val Pro Gly Asp Leu 
                645                  650                655    
Gly Ala Pro Gly Pro Ser Gly Ala Arg Gly Glu Arg Gly Phe Pro Gly 
            660                  665                670        
Glu Arg Gly Val Gln Gly Pro Pro Gly Pro Ala Gly Pro Arg Gly Asn 
        675                  680                685            
Asn Gly Ala Pro Gly Asn Asp Gly Ala Lys Gly Asp Thr Gly Ala Pro 
    690                  695                700                
Gly Ala Pro Gly Ser Gln Gly Ala Pro Gly Leu Gln Gly Met Pro Gly 
705                  710                715                  720
Glu Arg Gly Ala Ala Gly Leu Pro Gly Pro Lys Gly Asp Arg Gly Asp 
                725                  730                735    
Ala Gly Pro Lys Gly Ala Asp Gly Ser Pro Gly Lys Asp Gly Val Arg 
            740                  745                750        
Gly Leu Thr Gly Pro Ile Gly Pro Pro Gly Pro Ala Gly Ala Pro Gly 
        755                  760                765            
Asp Lys Gly Glu Thr Gly Pro Ser Gly Pro Ala Gly Pro Thr Gly Ala 
    770                  775                780                
Arg Gly Ala Pro Gly Asp Arg Gly Glu Pro Gly Pro Pro Gly Pro Ala 
785                  790                795                  800
Gly Phe Ala Gly Pro Pro Gly Ala Asp Gly Gln Pro Gly Ala Lys Gly 
                805                  810                815    
Glu Pro Gly Asp Thr Gly Val Lys Gly Asp Ala Gly Pro Pro Gly Pro 
            820                  825                830        
Ala Gly Pro Ala Gly Pro Pro Gly Pro Ile Gly Asn Val Gly Ala Pro 
        835                  840                845            
Gly Pro Lys Gly Ser Arg Gly Ala Ala Gly Pro Pro Gly Ala Thr Gly 
    850                  855                860                
Phe Pro Gly Ala Ala Gly Arg Val Gly Pro Pro Gly Pro Ser Gly Asn 
865                  870                875                  880
Ala Gly Pro Pro Gly Pro Pro Gly Pro Val Gly Lys Glu Gly Gly Lys 
                885                  890                895    
Gly Pro Arg Gly Glu Thr Gly Pro Ala Gly Arg Pro Gly Glu Val Gly 
            900                  905                910        
Pro Pro Gly Pro Pro Gly Pro Ala Gly Glu Lys Gly Ser Pro Gly Ala 
        915                  920                925            
Asp Gly Pro Ala Gly Ser Pro Gly Thr Pro Gly Pro Gln Gly Ile Ala 
    930                  935                940                
Gly Gln Arg Gly Val Val Gly Leu Pro Gly Gln Arg Gly Glu Arg Gly 
945                  950                955                  960
Phe Pro Gly Leu Pro Gly Pro Ser Gly Glu Pro Gly Lys Gln Gly Pro 
                965                  970                975    
Ser Gly Ala Ser Gly Glu Arg Gly Pro Pro Gly Pro Met Gly Pro Pro 
            980                  985                990        
Gly Leu Ala Gly Pro Pro Gly Glu Ser Gly Arg Glu Gly Ser Pro Gly 
        995                  1000                1005            
Ala Glu Gly Ser Pro Gly Arg Asp Gly Ala Pro Gly Ala Lys Gly Asp 
    1010                1015                1020                
Arg Gly Glu Thr Gly Pro Ala Gly Pro Pro Gly Ala Pro Gly Ala Pro 
1025                1030                1035                1040
Gly Ala Pro Gly Pro Val Gly Pro Ala Gly Lys Asn Gly Asp Arg Gly 
                1045                1050                1055    
Glu Thr Gly Pro Ala Gly Pro Ala Gly Pro Ile Gly Pro Ala Gly Ala 
            1060                1065                1070        
Arg Gly Pro Ala Gly Pro Gln Gly Pro Arg Gly Asp Lys Gly Glu Thr 
        1075                1080                1085            
Gly Glu Gln Gly Asp Arg Gly Ile Lys Gly His Arg Gly Phe Ser Gly 
    1090                1095                1100                
Leu Gln Gly Pro Pro Gly Ser Pro Gly Ser Pro Gly Glu Gln Gly Pro 
1105                1110                1115                1120
Ser Gly Ala Ser Gly Pro Ala Gly Pro Arg Gly Pro Pro Gly Ser Ala 
                1125                1130                1135    
Gly Ser Pro Gly Lys Asp Gly Leu Asn Gly Leu Pro Gly Pro Ile Gly 
            1140                1145                1150        
Pro Pro Gly Pro Arg Gly Arg Thr Gly Asp Ser Gly Pro Ala Gly Pro 
        1155                1160                1165            
Pro Gly Pro Pro Gly Pro Pro Gly Pro Pro Gly Pro Pro Ser Gly Gly 
    1170                1175                1180                
Tyr Asp Phe Ser Phe Leu Pro Gln Pro Pro Gln Glu Lys Ser Gln Asp 
1185                1190                1195                1200
Gly Gly Arg Tyr Tyr Arg Ala Asp Asp Ala Asn Val Val Arg Asp Arg 
                1205                1210                1215    
Asp Leu Glu Val Asp Thr Thr Leu Lys Ser Leu Ser Gln Gln Ile Glu 
            1220                1225                1230        
Asn Ile Arg Ser Pro Glu Gly Ser Arg Lys Asn Pro Ala Arg Thr Cys 
        1235                1240                1245            
Arg Asp Leu Lys Met Cys His Ser Asp Trp Lys Ser Gly Glu Tyr Trp 
    1250                1255                1260                
Ile Asp Pro Asn Gln Gly Cys Asn Leu Asp Ala Ile Lys Val Tyr Cys 
1265                1270                1275                1280
Asn Met Glu Thr Gly Gln Thr Cys Val Phe Pro Thr Gln Pro Ser Val 
                1285                1290                1295    
Pro Gln Lys Asn Trp Tyr Ile Ser Pro Asn Pro Lys Glu Lys Lys His 
            1300                1305                1310        
Val Trp Phe Gly Glu Ser Met Thr Asp Gly Phe Gln Phe Glu Tyr Gly 
        1315                1320                1325            
Ser Glu Gly Ser Asp Pro Ala Asp Val Ala Ile Gln Leu Thr Phe Leu 
    1330                1335                1340                
Arg Leu Met Ser Thr Glu Ala Ser Gln Asn Ile Thr Tyr His Cys Lys 
1345                1350                1355                1360
Asn Ser Val Ala Tyr Met Asp Gln Gln Thr Gly Asn Leu Lys Lys Ser 
                1365                1370                1375    
Leu Leu Leu Gln Gly Ser Asn Glu Ile Glu Leu Arg Gly Glu Gly Asn 
            1380                1385                1390        
Ser Arg Phe Thr Tyr Ser Thr Leu Val Asp Gly Cys Thr Ser His Thr 
        1395                1400                1405            
Gly Thr Trp Gly Lys Thr Val Ile Glu Tyr Lys Thr Thr Lys Thr Ser 
    1410                1415                1420                
Arg Leu Pro Ile Ile Asp Val Ala Pro Leu Asp Ile Gly Ala Pro Asp 
1425                1430                1435                1440
Gln Glu Phe Gly Met Asp Ile Gly Pro Ala Cys Phe Val 
                1445                1450            

<210> 79
<211> 4792
<212> DNA
<213> Rattus norvegicus

<220> 
<221> source
<222> 1..4792
<223> /mol_type="DNA"
      /note="Rattus norvegicus Col3A1"
      /organism="Rattus norvegicus"

<400> 79
acgggcccgg tgctgaaggg cagggaacaa ctgatggtgc tactgtgagc tgcttcttcc       60

tctctcctct tttgcacaaa gagtctcatg tctgatattt agacatgatg agctttgtgc      120

aatgtgggac ctggtttctt ctcaccctgc ttcacccctc tcttattttg gcacagcagt      180

ccaatgtaga tgaattggga tgcaactacc ttggtcagtc ctatgagtct agagatgtct      240

ggaagccaga accatgtcaa atatgtgtct gcgactcggg atctgtcctc tgtgatgaca      300

taatgtgtga tgatgagcca ctagactgcc ccaacccaga gatcccattt ggagaatgtt      360

gtgcaatatg tccacagcct tctacacctg ctcctgtcat tcctgatggt aatagacctc      420

aaggccccaa gggagatcca ggccctcctg gcattcctgg gagaaatggc gaccctggtc      480

ttccaggaca accagggctc cctggtcctc ctggctcccc tggaatctgt gaatcatgtc      540

caactggtgg ccagaattat tctccccaat tcgactcata tgatgtcaag tctggagtcg      600

gaggaatggg tggctatcct ggaccagctg gtccaccagg ccctccagga ccccctggtt      660

cctctggaca tcctggatct cctggttctc ctggatacca aggtcctcct ggtgaaccgg      720

gtcaagctgg tcctgcaggc cctccaggac ctcctggtgc tattggtcca tctggccctg      780

caggaaagga tggagagtca ggaagacccg gacgacctgg agagcgtgga ctgcctggac      840

ctccaggtat caaaggccca gctggtatcc ctggattccc gggtatgaaa ggacacagag      900

gctttgatgg acgcaatgga gagaagggtg aaaccggtgc tcctggattg aagggtgaaa      960

acggtcttcc gggagacaac ggagctcctg gccccatggg tcccagaggg gctcctggtg     1020

agcgaggacg accaggtctt cctggagccg caggtgctcg aggcaatgat ggtgctcggg     1080

gcagtgacgg gcaaccaggt ccccctggtc ctcctggaac tgcaggattc cctggatctc     1140

ctggtgctaa gggtgaggtt ggacctgcag gatcccctgg ctcaaatggc tctccaggac     1200

aaagagggga acctggacca caaggacacg ctggtgctca aggacctcct ggccctcctg     1260

gcaataatgg cagtcctggt gggaaaggtg aaatgggtcc agctggcatt cctggagctc     1320

ctggactcct aggagctagg ggtccccctg gaccagcagg agctaatggt gcaccgggac     1380

aacgaggtcc ttcaggcgaa ccgggcaaga atggagcaaa gggagagcca ggagctcgcg     1440

gtgaacgggg cgaagctggt tccccaggga ttccaggacc taagggcgaa gacggcaaag     1500

atgggtcacc aggagaacct ggtgcaaatg gagttccagg aaacccagga gaaaggggtg     1560

cccctggctt ccgaggacct gcagggccaa atggcgcccc aggagaaaag ggtcctgctg     1620

gagagcgtgg tggcccaggt cctgcaggac ctagaggagt agctggagaa cctggccgag     1680

atggaacccc tggaggtcca gggatacggg gtatgcccgg aagtccaggt ggaccaggca     1740

atgatgggaa accaggacct cctggaagtc aaggagaaag tggtcgccct ggtcctcctg     1800

gcccatctgg ccccagaggt cagcctggtg tcatgggttt ccctggtcct aaaggaaatg     1860

atggtgcacc tggcaaaaac ggagaacggg gtggccctgg gggtcctggc cttccaggtc     1920

ctgctggaaa gaatggggag actggacctc agggtccccc aggacctact ggcgcacctg     1980

gtgacaaggg agacgctgga ccccctggtc cacaaggatt acaaggcata cctggtacca     2040

gtggtcctcc aggagaaaat ggaaaaccag gagaaccagg tccaaagggt gaagctggag     2100

cacctggagt tcctggaggc aagggtgatt ctggtgcccc tggagaacgt ggaccccctg     2160

gaaccgcagg aacccctggg cttagaggtg gagctggacc ccctgggcct gagggaggaa     2220

agggccctgc tggtccccct ggtccccctg gtacttctgg tcctcctggt ctgcaaggga     2280

tgccaggaga gagaggaggt cctgggagtc ctggcccaaa gggtgaaaag ggtgagccag     2340

gcggtgcggg tgctgatgga gttccaggaa aggatgggcc gagaggtcct gctggtccta     2400

ttggtccccc tggcccagct ggtcagcctg gagataaggg tgaaggtggt gcccctggac     2460

ttccaggtat agctggacct cgaggtggcc ctggtgagag aggtgaacat ggccctccag     2520

gacctgctgg cttcccgggt gctcctgggc agaatggtga accaggtgct aaaggagaaa     2580

gaggtgcccc cggagagaaa ggtgaaggag gccctcctgg tgccgcagga ccccctggtg     2640

gttctggacc tgctggtcct cctgggcctc aaggtgtaaa gggtgaacgg ggcagtcctg     2700

gcggtcctgg tgctgctggc tttcccggtg gccgtggtct tcctggtcct cccggcaaca     2760

atggtaatcc agggccccca ggacccagtg gtgctcctgg caaggatggc cctccaggtc     2820

ctgcaggtaa cagtggttct cctggaaacc ctggagtagc tggaccaaaa ggtgatgctg     2880

gccaaccagg agagaagggg ccacctggtg ctcagggtcc tccaggatct ccaggtccac     2940

ttggaattgc agggctaact ggagcacgag gtcttgctgg accaccaggc atgccaggtc     3000

cacggggtag ccctggacct cagggtatca agggtgaaag tggaaagcca ggagccagtg     3060

gccataatgg ggaacgtggt cctcctggac cccaaggtct tcctggtcag cctggtacag     3120

ctggtgagcc cggaagggat ggaaaccctg gatcagatgg tcagccaggt cgagacggat     3180

ctcctggtgg caagggtgat cgtggtgaaa atggttctcc tggtgcccca ggcgctcctg     3240

gtcatccagg accacctggt cctgttggtc catctggaaa aaatggtgac agaggagaaa     3300

cgggtcctgc tggtccttct ggtgctccag gtcctgctgg agctcggggt gctcctggtc     3360

cccaaggtcc acgaggtgac aaaggtgaaa ctggtgaacg tggctctaat ggcatcaaag     3420

gacatcgagg attccctggc aatccaggtc ccccaggttc tcccggtgct gctggacacc     3480

agggtgcagt tggtagtcca ggccctgcag gtcccagagg cccagttggt ccacatggac     3540

ctcctggaaa agatggatca agtggacatc caggtcccat tggaccacca gggcctcgag     3600

gtaacagagg tgaaagagga tctgagggct cgcccggtca ccctggacag ccaggacccc     3660

ctggaccccc tggtgcccct ggtccctgct gtggtggcgg tgctgccatt gctggagttg     3720

gaggtgaaaa gtctggcggc ttttcaccat attacgggga tgatccaatg gatttcaaga     3780

tcaacactga ggagatcatg tcttcactca agtctgttaa cggacaaata gagagtctta     3840

tcagccctga tggttctaga aaaaaccctg ctcggaattg cagagacctg aaattctgcc     3900

accctgaact caagagcgga gaatactggg ttgatcctaa ccaaggctgc aagatggatg     3960

ctataaaagt gttctgtaat atggaaaccg gagaaacatg cataaatgcc agtcccatga     4020

ctgtcccgcg gaagcactgg tggacagatg ctggtgctga gaagaaacat gtttggtttg     4080

gagaatctat gaatggtggc tttcagttca gctatggcaa tcctgatctt cctgaagatg     4140

tccttgatgt acagctggcc ttcctcagac ttctttccag ccgggcctcc cagaacatta     4200

cataccactg caaaaacagc attgcctaca tggatcaggc caatggcaat gtaaagaagt     4260

ctctgaagct gatgggatcc aatgagggag aattcaaggc tgaaggaaat agcaaattca     4320

cttacacagt tctagaggat ggctgcacta aacacactgg tgaatggagc aagacagtct     4380

ttgaatatca aacacgcaag gccatgagac tccccatcat agatatcgca ccctatgaca     4440

ttggtggtcc tgatcaagaa tttggtgtgg acattggccc tgtttgcttt ttataagcca     4500

aactctctga aaccccagca aaacaaaaac cacatccatg tgttcctctt gctttaatct     4560

cgtcaaccag tgaaagtgac caactaaatt ccagttattt atttccaaac ttttggaaaa     4620

agcataattt gacaaaaata gaatacaatt tttttgctgt ttcacccacc aatacagttc     4680

aaatgctttt gttttatttt tttaccaatt ccaacttcat aatgtctcaa tggtgctata     4740

ataaataaac atcaacactt ttatgataaa aaaaaaaaaa aaaaaaaaaa aa             4792


<210> 80
<211> 1463
<212> PRT
<213> Rattus norvegicus

<220> 
<221> SOURCE
<222> 1..1463
<223> /mol_type="protein"
      /note="Rattus norvegicus Col3A1"
      /organism="Rattus norvegicus"

<400> 80
Met Met Ser Phe Val Gln Cys Gly Thr Trp Phe Leu Leu Thr Leu Leu 
1               5                   10                   15    
His Pro Ser Leu Ile Leu Ala Gln Gln Ser Asn Val Asp Glu Leu Gly 
            20                   25                  30        
Cys Asn Tyr Leu Gly Gln Ser Tyr Glu Ser Arg Asp Val Trp Lys Pro 
        35                   40                  45            
Glu Pro Cys Gln Ile Cys Val Cys Asp Ser Gly Ser Val Leu Cys Asp 
    50                   55                  60                
Asp Ile Met Cys Asp Asp Glu Pro Leu Asp Cys Pro Asn Pro Glu Ile 
65                   70                  75                  80
Pro Phe Gly Glu Cys Cys Ala Ile Cys Pro Gln Pro Ser Thr Pro Ala 
                85                   90                  95    
Pro Val Ile Pro Asp Gly Asn Arg Pro Gln Gly Pro Lys Gly Asp Pro 
            100                  105                110        
Gly Pro Pro Gly Ile Pro Gly Arg Asn Gly Asp Pro Gly Leu Pro Gly 
        115                  120                125            
Gln Pro Gly Leu Pro Gly Pro Pro Gly Ser Pro Gly Ile Cys Glu Ser 
    130                  135                140                
Cys Pro Thr Gly Gly Gln Asn Tyr Ser Pro Gln Phe Asp Ser Tyr Asp 
145                  150                155                  160
Val Lys Ser Gly Val Gly Gly Met Gly Gly Tyr Pro Gly Pro Ala Gly 
                165                  170                175    
Pro Pro Gly Pro Pro Gly Pro Pro Gly Ser Ser Gly His Pro Gly Ser 
            180                  185                190        
Pro Gly Ser Pro Gly Tyr Gln Gly Pro Pro Gly Glu Pro Gly Gln Ala 
        195                  200                205            
Gly Pro Ala Gly Pro Pro Gly Pro Pro Gly Ala Ile Gly Pro Ser Gly 
    210                  215                220                
Pro Ala Gly Lys Asp Gly Glu Ser Gly Arg Pro Gly Arg Pro Gly Glu 
225                  230                235                  240
Arg Gly Leu Pro Gly Pro Pro Gly Ile Lys Gly Pro Ala Gly Ile Pro 
                245                  250                255    
Gly Phe Pro Gly Met Lys Gly His Arg Gly Phe Asp Gly Arg Asn Gly 
            260                  265                270        
Glu Lys Gly Glu Thr Gly Ala Pro Gly Leu Lys Gly Glu Asn Gly Leu 
        275                  280                285            
Pro Gly Asp Asn Gly Ala Pro Gly Pro Met Gly Pro Arg Gly Ala Pro 
    290                  295                300                
Gly Glu Arg Gly Arg Pro Gly Leu Pro Gly Ala Ala Gly Ala Arg Gly 
305                  310                315                  320
Asn Asp Gly Ala Arg Gly Ser Asp Gly Gln Pro Gly Pro Pro Gly Pro 
                325                  330                335    
Pro Gly Thr Ala Gly Phe Pro Gly Ser Pro Gly Ala Lys Gly Glu Val 
            340                  345                350        
Gly Pro Ala Gly Ser Pro Gly Ser Asn Gly Ser Pro Gly Gln Arg Gly 
        355                  360                365            
Glu Pro Gly Pro Gln Gly His Ala Gly Ala Gln Gly Pro Pro Gly Pro 
    370                  375                380                
Pro Gly Asn Asn Gly Ser Pro Gly Gly Lys Gly Glu Met Gly Pro Ala 
385                  390                395                  400
Gly Ile Pro Gly Ala Pro Gly Leu Leu Gly Ala Arg Gly Pro Pro Gly 
                405                  410                415    
Pro Ala Gly Ala Asn Gly Ala Pro Gly Gln Arg Gly Pro Ser Gly Glu 
            420                  425                430        
Pro Gly Lys Asn Gly Ala Lys Gly Glu Pro Gly Ala Arg Gly Glu Arg 
        435                  440                445            
Gly Glu Ala Gly Ser Pro Gly Ile Pro Gly Pro Lys Gly Glu Asp Gly 
    450                  455                460                
Lys Asp Gly Ser Pro Gly Glu Pro Gly Ala Asn Gly Val Pro Gly Asn 
465                  470                475                  480
Pro Gly Glu Arg Gly Ala Pro Gly Phe Arg Gly Pro Ala Gly Pro Asn 
                485                  490                495    
Gly Ala Pro Gly Glu Lys Gly Pro Ala Gly Glu Arg Gly Gly Pro Gly 
            500                  505                510        
Pro Ala Gly Pro Arg Gly Val Ala Gly Glu Pro Gly Arg Asp Gly Thr 
        515                  520                525            
Pro Gly Gly Pro Gly Ile Arg Gly Met Pro Gly Ser Pro Gly Gly Pro 
    530                  535                540                
Gly Asn Asp Gly Lys Pro Gly Pro Pro Gly Ser Gln Gly Glu Ser Gly 
545                  550                555                  560
Arg Pro Gly Pro Pro Gly Pro Ser Gly Pro Arg Gly Gln Pro Gly Val 
                565                  570                575    
Met Gly Phe Pro Gly Pro Lys Gly Asn Asp Gly Ala Pro Gly Lys Asn 
            580                  585                590        
Gly Glu Arg Gly Gly Pro Gly Gly Pro Gly Leu Pro Gly Pro Ala Gly 
        595                  600                605            
Lys Asn Gly Glu Thr Gly Pro Gln Gly Pro Pro Gly Pro Thr Gly Ala 
    610                  615                620                
Pro Gly Asp Lys Gly Asp Ala Gly Pro Pro Gly Pro Gln Gly Leu Gln 
625                  630                635                  640
Gly Ile Pro Gly Thr Ser Gly Pro Pro Gly Glu Asn Gly Lys Pro Gly 
                645                  650                655    
Glu Pro Gly Pro Lys Gly Glu Ala Gly Ala Pro Gly Val Pro Gly Gly 
            660                  665                670        
Lys Gly Asp Ser Gly Ala Pro Gly Glu Arg Gly Pro Pro Gly Thr Ala 
        675                  680                685            
Gly Thr Pro Gly Leu Arg Gly Gly Ala Gly Pro Pro Gly Pro Glu Gly 
    690                  695                700                
Gly Lys Gly Pro Ala Gly Pro Pro Gly Pro Pro Gly Thr Ser Gly Pro 
705                  710                715                  720
Pro Gly Leu Gln Gly Met Pro Gly Glu Arg Gly Gly Pro Gly Ser Pro 
                725                  730                735    
Gly Pro Lys Gly Glu Lys Gly Glu Pro Gly Gly Ala Gly Ala Asp Gly 
            740                  745                750        
Val Pro Gly Lys Asp Gly Pro Arg Gly Pro Ala Gly Pro Ile Gly Pro 
        755                  760                765            
Pro Gly Pro Ala Gly Gln Pro Gly Asp Lys Gly Glu Gly Gly Ala Pro 
    770                  775                780                
Gly Leu Pro Gly Ile Ala Gly Pro Arg Gly Gly Pro Gly Glu Arg Gly 
785                  790                795                  800
Glu His Gly Pro Pro Gly Pro Ala Gly Phe Pro Gly Ala Pro Gly Gln 
                805                  810                815    
Asn Gly Glu Pro Gly Ala Lys Gly Glu Arg Gly Ala Pro Gly Glu Lys 
            820                  825                830        
Gly Glu Gly Gly Pro Pro Gly Ala Ala Gly Pro Pro Gly Gly Ser Gly 
        835                  840                845            
Pro Ala Gly Pro Pro Gly Pro Gln Gly Val Lys Gly Glu Arg Gly Ser 
    850                  855                860                
Pro Gly Gly Pro Gly Ala Ala Gly Phe Pro Gly Gly Arg Gly Leu Pro 
865                  870                875                  880
Gly Pro Pro Gly Asn Asn Gly Asn Pro Gly Pro Pro Gly Pro Ser Gly 
                885                  890                895    
Ala Pro Gly Lys Asp Gly Pro Pro Gly Pro Ala Gly Asn Ser Gly Ser 
            900                  905                910        
Pro Gly Asn Pro Gly Val Ala Gly Pro Lys Gly Asp Ala Gly Gln Pro 
        915                  920                925            
Gly Glu Lys Gly Pro Pro Gly Ala Gln Gly Pro Pro Gly Ser Pro Gly 
    930                  935                940                
Pro Leu Gly Ile Ala Gly Leu Thr Gly Ala Arg Gly Leu Ala Gly Pro 
945                  950                955                  960
Pro Gly Met Pro Gly Pro Arg Gly Ser Pro Gly Pro Gln Gly Ile Lys 
                965                  970                975    
Gly Glu Ser Gly Lys Pro Gly Ala Ser Gly His Asn Gly Glu Arg Gly 
            980                  985                990        
Pro Pro Gly Pro Gln Gly Leu Pro Gly Gln Pro Gly Thr Ala Gly Glu 
        995                  1000                1005            
Pro Gly Arg Asp Gly Asn Pro Gly Ser Asp Gly Gln Pro Gly Arg Asp 
    1010                1015                1020                
Gly Ser Pro Gly Gly Lys Gly Asp Arg Gly Glu Asn Gly Ser Pro Gly 
1025                1030                1035                1040
Ala Pro Gly Ala Pro Gly His Pro Gly Pro Pro Gly Pro Val Gly Pro 
                1045                1050                1055    
Ser Gly Lys Asn Gly Asp Arg Gly Glu Thr Gly Pro Ala Gly Pro Ser 
            1060                1065                1070        
Gly Ala Pro Gly Pro Ala Gly Ala Arg Gly Ala Pro Gly Pro Gln Gly 
        1075                1080                1085            
Pro Arg Gly Asp Lys Gly Glu Thr Gly Glu Arg Gly Ser Asn Gly Ile 
    1090                1095                1100                
Lys Gly His Arg Gly Phe Pro Gly Asn Pro Gly Pro Pro Gly Ser Pro 
1105                1110                1115                1120
Gly Ala Ala Gly His Gln Gly Ala Val Gly Ser Pro Gly Pro Ala Gly 
                1125                1130                1135    
Pro Arg Gly Pro Val Gly Pro His Gly Pro Pro Gly Lys Asp Gly Ser 
            1140                1145                1150        
Ser Gly His Pro Gly Pro Ile Gly Pro Pro Gly Pro Arg Gly Asn Arg 
        1155                1160                1165            
Gly Glu Arg Gly Ser Glu Gly Ser Pro Gly His Pro Gly Gln Pro Gly 
    1170                1175                1180                
Pro Pro Gly Pro Pro Gly Ala Pro Gly Pro Cys Cys Gly Gly Gly Ala 
1185                1190                1195                1200
Ala Ile Ala Gly Val Gly Gly Glu Lys Ser Gly Gly Phe Ser Pro Tyr 
                1205                1210                1215    
Tyr Gly Asp Asp Pro Met Asp Phe Lys Ile Asn Thr Glu Glu Ile Met 
            1220                1225                1230        
Ser Ser Leu Lys Ser Val Asn Gly Gln Ile Glu Ser Leu Ile Ser Pro 
        1235                1240                1245            
Asp Gly Ser Arg Lys Asn Pro Ala Arg Asn Cys Arg Asp Leu Lys Phe 
    1250                1255                1260                
Cys His Pro Glu Leu Lys Ser Gly Glu Tyr Trp Val Asp Pro Asn Gln 
1265                1270                1275                1280
Gly Cys Lys Met Asp Ala Ile Lys Val Phe Cys Asn Met Glu Thr Gly 
                1285                1290                1295    
Glu Thr Cys Ile Asn Ala Ser Pro Met Thr Val Pro Arg Lys His Trp 
            1300                1305                1310        
Trp Thr Asp Ala Gly Ala Glu Lys Lys His Val Trp Phe Gly Glu Ser 
        1315                1320                1325            
Met Asn Gly Gly Phe Gln Phe Ser Tyr Gly Asn Pro Asp Leu Pro Glu 
    1330                1335                1340                
Asp Val Leu Asp Val Gln Leu Ala Phe Leu Arg Leu Leu Ser Ser Arg 
1345                1350                1355                1360
Ala Ser Gln Asn Ile Thr Tyr His Cys Lys Asn Ser Ile Ala Tyr Met 
                1365                1370                1375    
Asp Gln Ala Asn Gly Asn Val Lys Lys Ser Leu Lys Leu Met Gly Ser 
            1380                1385                1390        
Asn Glu Gly Glu Phe Lys Ala Glu Gly Asn Ser Lys Phe Thr Tyr Thr 
        1395                1400                1405            
Val Leu Glu Asp Gly Cys Thr Lys His Thr Gly Glu Trp Ser Lys Thr 
    1410                1415                1420                
Val Phe Glu Tyr Gln Thr Arg Lys Ala Met Arg Leu Pro Ile Ile Asp 
1425                1430                1435                1440
Ile Ala Pro Tyr Asp Ile Gly Gly Pro Asp Gln Glu Phe Gly Val Asp 
                1445                1450                1455    
Ile Gly Pro Val Cys Phe Leu 
            1460            

<210> 81
<211> 1388
<212> DNA
<213> Rattus norvegicus

<220> 
<221> source
<222> 1..1388
<223> /mol_type="DNA"
      /note="Rattus norvegicus Oct-4/POU5F1"
      /organism="Rattus norvegicus"

<400> 81
ggggagggag agaggtgcaa acagtcccta ggtgagtcgt ccttccacca ggcccccggc      60

tcggggagcc caccttcccc atggctggac acctggcttc agacttcgcc ttctcacccc     120

cacctggtgg gggtgatggg tcagcagggc tggagccggg ctgggtggac cctcgaacct     180

ggctaagctt ccaggggcct ccaagtgggc ctggaatcgg accaggttca gaggtgctgg     240

ggatctcccc gtgtccccca gcatacgagt tctgtggagg gatggcatac tgtggacctc     300

aggttggact gggcctagtc ccccaagttg gcgtggagac tctgcagccc gagggccagg     360

caggagcacg agtggagagc aactcggagg gagcctcctc tgggccctgt actgcccgcc     420

ccagcgccgt gaagttggag aaggtggaac ctagtcccga ggagtcccag gatatgaaag     480

ccctgcagaa ggagctagag cagtttgcca agctgctgaa acagaagagg atcaccttgg     540

ggtacaccca ggccgacgtg gggctcaccc tgggcgttct ctttggaaag gtgttcagcc     600

agacaaccat ctgccgcttc gaggccctgc agctcagcct taagaacatg tgtaagctgc     660

ggcccctgct ggagaagtgg gtggaggaag ctgacaacaa cgagaacctt caggagatat     720

gcaaatcgga gaccctggtg caggcccgga agagaaagcg gactagcatt gagaaccgtg     780

tgaggtggaa cctggagaac atgtttctgc agtgcccgaa gccctccctg cagcagatca     840

ctagcattgc caagcagctt gggctggaga gggatgtggt tcgagtgtgg ttctgtaacc     900

ggcgccagaa ggggaaaaga tcgagcattg aatattccca acgagaagag tatgaggccg     960

cggggaaacc tttcccaggg ggggctgtgt cctttcctct gcccccaggc ccccactttg    1020

gtgctccagg ctatgggagc ccccatttca ccacactcta ctcggtccct tttcctgagg    1080

gcgaggcctt tccctctgtt cctgtcactg ctctgggctc tcccatgcat tcaaactgag    1140

gcaccagccc tccctgggga tgaggtgagc caaggcaagg aagggaggta gacaaagaga    1200

acctgaagct ttggggccta gattctttta ctggggagga attgaaagca caaacagggg    1260

tggttggggg ggcggggggg gagagatgaa gttcagtgac gctgttgatc aggaacccgt    1320

ccgaagttct taagttctta aataaagtct gggatacaca gtaaaaaaaa aaaaaaaaaa    1380

aaaaaaaa                                                             1388


<210> 82
<211> 352
<212> PRT
<213> Rattus norvegicus

<220> 
<221> SOURCE
<222> 1..352
<223> /mol_type="protein"
      /note="Rattus norvegicus Oct-4"
      /organism="Rattus norvegicus"

<400> 82
Met Ala Gly His Leu Ala Ser Asp Phe Ala Phe Ser Pro Pro Pro Gly 
1               5                   10                   15    
Gly Gly Asp Gly Ser Ala Gly Leu Glu Pro Gly Trp Val Asp Pro Arg 
            20                   25                  30        
Thr Trp Leu Ser Phe Gln Gly Pro Pro Ser Gly Pro Gly Ile Gly Pro 
        35                   40                  45            
Gly Ser Glu Val Leu Gly Ile Ser Pro Cys Pro Pro Ala Tyr Glu Phe 
    50                   55                  60                
Cys Gly Gly Met Ala Tyr Cys Gly Pro Gln Val Gly Leu Gly Leu Val 
65                   70                  75                  80
Pro Gln Val Gly Val Glu Thr Leu Gln Pro Glu Gly Gln Ala Gly Ala 
                85                   90                  95    
Arg Val Glu Ser Asn Ser Glu Gly Ala Ser Ser Gly Pro Cys Thr Ala 
            100                  105                110        
Arg Pro Ser Ala Val Lys Leu Glu Lys Val Glu Pro Ser Pro Glu Glu 
        115                  120                125            
Ser Gln Asp Met Lys Ala Leu Gln Lys Glu Leu Glu Gln Phe Ala Lys 
    130                  135                140                
Leu Leu Lys Gln Lys Arg Ile Thr Leu Gly Tyr Thr Gln Ala Asp Val 
145                  150                155                  160
Gly Leu Thr Leu Gly Val Leu Phe Gly Lys Val Phe Ser Gln Thr Thr 
                165                  170                175    
Ile Cys Arg Phe Glu Ala Leu Gln Leu Ser Leu Lys Asn Met Cys Lys 
            180                  185                190        
Leu Arg Pro Leu Leu Glu Lys Trp Val Glu Glu Ala Asp Asn Asn Glu 
        195                  200                205            
Asn Leu Gln Glu Ile Cys Lys Ser Glu Thr Leu Val Gln Ala Arg Lys 
    210                  215                220                
Arg Lys Arg Thr Ser Ile Glu Asn Arg Val Arg Trp Asn Leu Glu Asn 
225                  230                235                  240
Met Phe Leu Gln Cys Pro Lys Pro Ser Leu Gln Gln Ile Thr Ser Ile 
                245                  250                255    
Ala Lys Gln Leu Gly Leu Glu Arg Asp Val Val Arg Val Trp Phe Cys 
            260                  265                270        
Asn Arg Arg Gln Lys Gly Lys Arg Ser Ser Ile Glu Tyr Ser Gln Arg 
        275                  280                285            
Glu Glu Tyr Glu Ala Ala Gly Lys Pro Phe Pro Gly Gly Ala Val Ser 
    290                  295                300                
Phe Pro Leu Pro Pro Gly Pro His Phe Gly Ala Pro Gly Tyr Gly Ser 
305                  310                315                  320
Pro His Phe Thr Thr Leu Tyr Ser Val Pro Phe Pro Glu Gly Glu Ala 
                325                  330                335    
Phe Pro Ser Val Pro Val Thr Ala Leu Gly Ser Pro Met His Ser Asn 
            340                  345                350        

<210> 83
<211> 2057
<212> DNA
<213> Rattus norvegicus

<220> 
<221> source
<222> 1..2057
<223> /mol_type="DNA"
      /note="Rattus norvegicus Galc"
      /organism="Rattus norvegicus"

<400> 83
atgtaacagc cgacctaagg cttcccagca acgccaagca aaagtcatga ccgccgccgc      60

gggctcggcg agccgtgtcg cggtgccctt gttgttgtgc gcgatgctgg cgcccagcgg     120

cgcctacgag ctagacgact ccgacgggct gggcctggag ttcgatggca tcggcgcagt     180

cagcggcggc ggggcaacct cccggcttct agtaaattac ccagagccct atcgttctga     240

aatactggat tatctattta agccaaactt cggtgcctct ctgcatattc taaaagtgga     300

aataggtggc gatggacaaa caacagacgg cactgaaccc tcccacatgc actatgagct     360

agatgagaat tatttccgag gctatgagtg gtggctaatg aaggaagcta agaagaggaa     420

cccaaatatt atacttatgg ggttgccatg gtcattccct ggatggctgg gcaaaggctt     480

cagttggcct tatgtaaatc ttcagctgac tgccttctat attgtgagat ggattttggg     540

tgccaagcat tatcatgacc tggacattga ttatattggg atatggaatg aaaggccgtt     600

tgatgccaac tatataaagg aattaagaaa aatgcttgat tatgaaggtc tccagcgagt     660

gagaatcata gcaagtgata atctctggga gccaatttcc tcttctgtgc tgcttgacca     720

ggagctctgg aaggtggttg atgttatagg agctcattat cccggaacct acacagtctg     780

gaatgcaaag atgtcaggga agaagctttg gtcgtcggaa gactttagca ctgtcaacag     840

taatgttggc gcaggctgtt ggggtcgcat attgaaccag aattacatca acggcaatat     900

gaccgccaca attgcttgga atttggtggc tagttactat gaagaattgc cctatggacg     960

aagtggattg atgacagccc aggagccgtg gagtggacat tatgtagtag catctcctat    1020

ctgggtatca gctcatacaa ctcaatttac tcaaccaggc tggtattacc tgaagacagt    1080

tggccatcta gagaaaggag gaagctatgt agctctgact gatggcttgg ggaatttcac    1140

catcatcgtt gaaactatga gtcgtcaaca ttctatgtgt atacggccat atctaccgta    1200

ttataatgtc tcacgtcagc tggccacctt cattctaaag gggtctttga aagaaataca    1260

agagctgcag gtgtggtaca ccaagcttgg aacaacacca gagaaacttc attttaaaca    1320

actggaaact ctatggctcc ttgacggcag cggcagtttc tcactggaac tggaggagga    1380

tgagatgttc acactcacca ctctgaccac agggcacaaa ggcagctacc gtccccctcc    1440

caagtcacag cccttcccaa ccagctataa ggatgatttc aacgttgagt acccattatt    1500

tagtgaagct ccgaattttg ctgatcagac cggcgtgttc gagtactaca cgaataacga    1560

agaccttgag catcgcttca cactgcgcca agttctcaac caacgaccta ttacctgggc    1620

cgcggatgcc tccagcacga tcagtgtcat aggcgatcac cactggagca acatgactgt    1680

gcagtgtgat gtttacatag agactcctcg gactggcggt gtgttcattg ctggaagagt    1740

gaataaaggt ggtatcttga tcagaactgc ttcaggagtt ttcttctgga tttttgcaaa    1800

tggctcttac agagttacag ccgacctggg tgggtggata acatatgctt caggacatgc    1860

tgacgttaca gcaaagcgat ggtatacact caccttaggc attaagggtt atctcgcctc    1920

tggtatgttg aacggcaaga tcctgtggga aaatgtgccc gtgaaatacc cagggcatgg    1980

ctgggctgcg atcggaacgc ataccttcga gtttgcgcag tttgacaact ttcatgtgga    2040

agctgctcgc taatatt                                                   2057


<210> 84
<211> 668
<212> PRT
<213> Rattus norvegicus

<220> 
<221> SOURCE
<222> 1..668
<223> /mol_type="protein"
      /note="Rattus norvegicus Galc"
      /organism="Rattus norvegicus"

<400> 84
Met Thr Ala Ala Ala Gly Ser Ala Ser Arg Val Ala Val Pro Leu Leu 
1               5                   10                   15    
Leu Cys Ala Met Leu Ala Pro Ser Gly Ala Tyr Glu Leu Asp Asp Ser 
            20                   25                  30        
Asp Gly Leu Gly Leu Glu Phe Asp Gly Ile Gly Ala Val Ser Gly Gly 
        35                   40                  45            
Gly Ala Thr Ser Arg Leu Leu Val Asn Tyr Pro Glu Pro Tyr Arg Ser 
    50                   55                  60                
Glu Ile Leu Asp Tyr Leu Phe Lys Pro Asn Phe Gly Ala Ser Leu His 
65                   70                  75                  80
Ile Leu Lys Val Glu Ile Gly Gly Asp Gly Gln Thr Thr Asp Gly Thr 
                85                   90                  95    
Glu Pro Ser His Met His Tyr Glu Leu Asp Glu Asn Tyr Phe Arg Gly 
            100                  105                110        
Tyr Glu Trp Trp Leu Met Lys Glu Ala Lys Lys Arg Asn Pro Asn Ile 
        115                  120                125            
Ile Leu Met Gly Leu Pro Trp Ser Phe Pro Gly Trp Leu Gly Lys Gly 
    130                  135                140                
Phe Ser Trp Pro Tyr Val Asn Leu Gln Leu Thr Ala Phe Tyr Ile Val 
145                  150                155                  160
Arg Trp Ile Leu Gly Ala Lys His Tyr His Asp Leu Asp Ile Asp Tyr 
                165                  170                175    
Ile Gly Ile Trp Asn Glu Arg Pro Phe Asp Ala Asn Tyr Ile Lys Glu 
            180                  185                190        
Leu Arg Lys Met Leu Asp Tyr Glu Gly Leu Gln Arg Val Arg Ile Ile 
        195                  200                205            
Ala Ser Asp Asn Leu Trp Glu Pro Ile Ser Ser Ser Val Leu Leu Asp 
    210                  215                220                
Gln Glu Leu Trp Lys Val Val Asp Val Ile Gly Ala His Tyr Pro Gly 
225                  230                235                  240
Thr Tyr Thr Val Trp Asn Ala Lys Met Ser Gly Lys Lys Leu Trp Ser 
                245                  250                255    
Ser Glu Asp Phe Ser Thr Val Asn Ser Asn Val Gly Ala Gly Cys Trp 
            260                  265                270        
Gly Arg Ile Leu Asn Gln Asn Tyr Ile Asn Gly Asn Met Thr Ala Thr 
        275                  280                285            
Ile Ala Trp Asn Leu Val Ala Ser Tyr Tyr Glu Glu Leu Pro Tyr Gly 
    290                  295                300                
Arg Ser Gly Leu Met Thr Ala Gln Glu Pro Trp Ser Gly His Tyr Val 
305                  310                315                  320
Val Ala Ser Pro Ile Trp Val Ser Ala His Thr Thr Gln Phe Thr Gln 
                325                  330                335    
Pro Gly Trp Tyr Tyr Leu Lys Thr Val Gly His Leu Glu Lys Gly Gly 
            340                  345                350        
Ser Tyr Val Ala Leu Thr Asp Gly Leu Gly Asn Phe Thr Ile Ile Val 
        355                  360                365            
Glu Thr Met Ser Arg Gln His Ser Met Cys Ile Arg Pro Tyr Leu Pro 
    370                  375                380                
Tyr Tyr Asn Val Ser Arg Gln Leu Ala Thr Phe Ile Leu Lys Gly Ser 
385                  390                395                  400
Leu Lys Glu Ile Gln Glu Leu Gln Val Trp Tyr Thr Lys Leu Gly Thr 
                405                  410                415    
Thr Pro Glu Lys Leu His Phe Lys Gln Leu Glu Thr Leu Trp Leu Leu 
            420                  425                430        
Asp Gly Ser Gly Ser Phe Ser Leu Glu Leu Glu Glu Asp Glu Met Phe 
        435                  440                445            
Thr Leu Thr Thr Leu Thr Thr Gly His Lys Gly Ser Tyr Arg Pro Pro 
    450                  455                460                
Pro Lys Ser Gln Pro Phe Pro Thr Ser Tyr Lys Asp Asp Phe Asn Val 
465                  470                475                  480
Glu Tyr Pro Leu Phe Ser Glu Ala Pro Asn Phe Ala Asp Gln Thr Gly 
                485                  490                495    
Val Phe Glu Tyr Tyr Thr Asn Asn Glu Asp Leu Glu His Arg Phe Thr 
            500                  505                510        
Leu Arg Gln Val Leu Asn Gln Arg Pro Ile Thr Trp Ala Ala Asp Ala 
        515                  520                525            
Ser Ser Thr Ile Ser Val Ile Gly Asp His His Trp Ser Asn Met Thr 
    530                  535                540                
Val Gln Cys Asp Val Tyr Ile Glu Thr Pro Arg Thr Gly Gly Val Phe 
545                  550                555                  560
Ile Ala Gly Arg Val Asn Lys Gly Gly Ile Leu Ile Arg Thr Ala Ser 
                565                  570                575    
Gly Val Phe Phe Trp Ile Phe Ala Asn Gly Ser Tyr Arg Val Thr Ala 
            580                  585                590        
Asp Leu Gly Gly Trp Ile Thr Tyr Ala Ser Gly His Ala Asp Val Thr 
        595                  600                605            
Ala Lys Arg Trp Tyr Thr Leu Thr Leu Gly Ile Lys Gly Tyr Leu Ala 
    610                  615                620                
Ser Gly Met Leu Asn Gly Lys Ile Leu Trp Glu Asn Val Pro Val Lys 
625                  630                635                  640
Tyr Pro Gly His Gly Trp Ala Ala Ile Gly Thr His Thr Phe Glu Phe 
                645                  650                655    
Ala Gln Phe Asp Asn Phe His Val Glu Ala Ala Arg 
            660                  665            

<210> 85
<211> 1134
<212> DNA
<213> Rattus norvegicus

<220> 
<221> source
<222> 1..1134
<223> /mol_type="DNA"
      /note="Rattus norvegicus Scleraxis"
      /organism="Rattus norvegicus"

<400> 85
gatccgctgg cggccccact ccagtccgaa cacatgtgcc cgcctcgccc ggcagccacc      60

accgcggggc gcagcggaga cccctggccc ggcggcctgt ggggacctaa agaggcggca     120

tgagcagcgc accgtggagc tgacgccgcg ccccctgccc ggcccatgtc cttcgccatg     180

ctgcgttcag cgccaccgcc gggccgctac ctgtaccctg aggtgagccc gctgtccgag     240

gatgaggacc gcggaagcga gagctcgggc tccgacgaaa aaccctgtcg tgttcatgct     300

gcgcgctgcg gcctccaggg cgcccggcgg cgggcaggag gacggagggc cgcgggtagt     360

gggccaggac ccggggggcg gccaggccgc gagccccggc agcggcacac agcgaatgcg     420

cgcgagcggg accgcaccaa cagcgtgaac acggccttca ctgcgctgcg cacactcatc     480

ccgaccgagc cagcagatcg caagctctcc aagattgaga cgctgcgcct ggcctccagc     540

tacatttctc acctgggcaa cgtgctactg gtgggtgaag cctgcggtga cgggcagccc     600

tgccactcgg gacccgcttt cttccacagc ggtcgtgcgg gcagcccact accaccgcca     660

ccgccgccgc ccccactacc actggccaga gacggcggcg agaacaccca gcccaaacag     720

atctgcacct tctgcctcag caaccagaga aagttgagca aagaccgtga cagaaagacg     780

gcgattcgaa gttagaagga ggagggtcca cagcagccaa gaggtgatgc cactagtgaa     840

ggtggaagcc actgaagagt catggagagc cccaccttgg acctgatctg agcacaggtc     900

cccaagagcg cgctcaccag gccagacctg ccccagctct gagcagggcc tgtgaacaga     960

gagatggaca ggcgggctat ggcttgactc taagtagctg aacacttgta cccaggccca    1020

ctggaacttt ccatgctggc tctctacctg ggccaagtgt tggcatcttg tgtctttaat    1080

atgataatat aaagtctgga aattttgtat aattaaagtg aaacagtatc ttcc          1134


<210> 86
<211> 209
<212> PRT
<213> Rattus norvegicus

<220> 
<221> SOURCE
<222> 1..209
<223> /mol_type="protein"
      /note="Rattus norvegicus Scleraxis"
      /organism="Rattus norvegicus"

<400> 86
Met Ser Phe Ala Met Leu Arg Ser Ala Pro Pro Pro Gly Arg Tyr Leu 
1               5                   10                   15    
Tyr Pro Glu Val Ser Pro Leu Ser Glu Asp Glu Asp Arg Gly Ser Glu 
            20                   25                  30        
Ser Ser Gly Ser Asp Glu Lys Pro Cys Arg Val His Ala Ala Arg Cys 
        35                   40                  45            
Gly Leu Gln Gly Ala Arg Arg Arg Ala Gly Gly Arg Arg Ala Ala Gly 
    50                   55                  60                
Ser Gly Pro Gly Pro Gly Gly Arg Pro Gly Arg Glu Pro Arg Gln Arg 
65                   70                  75                  80
His Thr Ala Asn Ala Arg Glu Arg Asp Arg Thr Asn Ser Val Asn Thr 
                85                   90                  95    
Ala Phe Thr Ala Leu Arg Thr Leu Ile Pro Thr Glu Pro Ala Asp Arg 
            100                  105                110        
Lys Leu Ser Lys Ile Glu Thr Leu Arg Leu Ala Ser Ser Tyr Ile Ser 
        115                  120                125            
His Leu Gly Asn Val Leu Leu Val Gly Glu Ala Cys Gly Asp Gly Gln 
    130                  135                140                
Pro Cys His Ser Gly Pro Ala Phe Phe His Ser Gly Arg Ala Gly Ser 
145                  150                155                  160
Pro Leu Pro Pro Pro Pro Pro Pro Pro Pro Leu Pro Leu Ala Arg Asp 
                165                  170                175    
Gly Gly Glu Asn Thr Gln Pro Lys Gln Ile Cys Thr Phe Cys Leu Ser 
            180                  185                190        
Asn Gln Arg Lys Leu Ser Lys Asp Arg Asp Arg Lys Thr Ala Ile Arg 
        195                  200                205            
Ser 
    

<210> 87
<211> 885
<212> DNA
<213> Rattus norvegicus

<220> 
<221> source
<222> 1..885
<223> /mol_type="DNA"
      /note="Rattus norvegicus Sox-9"
      /organism="Rattus norvegicus"

<400> 87
atgaagtcac tccctcccac ctcctccagg cgcctccccc cacctgatgg agccctgtgt      60

ctaagaagag actctgggct gggagccgga gagctgagag cgttgctcgg aactgtctgg     120

aaacttcagt gggagcgaca actttaccag tttcggtcca ggaacttttc tttgcaaaag     180

agacggggtg caagtagccc tggtttcgtt ctctgttttc cctccctcct cctccgctcc     240

gattcgcctt ccccgggttt ggagcgggca actgagcact ggccacccag cgcctctgct     300

aagtgctcgc cgccgcagcc gggtgacgcg ccaacctccc cgggagccgt tcgctcggcg     360

tccgcgtccg ggcagctgag ggaagaggag ccccagcagc cgcggcttct ctcctttccc     420

ggccacccgc cccctgcccc gggctcgcgt atgaatctcc tggacccctt catgaagatg     480

accgacgagc aggagaaggg cttgtctggc gcccccagcc ccaccatgtc ggaggactcg     540

gctggttcgc cctgcccctc gggctcaggc tccgacacgg agaacacacg gccccaggag     600

aacacgttcc ccaagggcga gccggatctg aagaaggaga gcgaggaaga taaattccca     660

gtgtgcatcc gcgaggcggt cagccaggtg ctgaagggct acgactggac cctggtgccc     720

atgccggtgc gcgtcaacgg ctccagcaag aacaagccac acgtcaagcg gcccatgaac     780

gccttcatgg tgtgggcgca ggctgcgcgc aggaagctgg cagaccagta cccgcatctg     840

cacaacgcgg agctcagcaa gactctgggc aagctctgga ggtga                     885


<210> 88
<211> 294
<212> PRT
<213> Rattus norvegicus

<220> 
<221> SOURCE
<222> 1..294
<223> /mol_type="protein"
      /note="Rattus norvegicus Sox-9"
      /organism="Rattus norvegicus"

<400> 88
Met Lys Ser Leu Pro Pro Thr Ser Ser Arg Arg Leu Pro Pro Pro Asp 
1               5                   10                   15    
Gly Ala Leu Cys Leu Arg Arg Asp Ser Gly Leu Gly Ala Gly Glu Leu 
            20                   25                  30        
Arg Ala Leu Leu Gly Thr Val Trp Lys Leu Gln Trp Glu Arg Gln Leu 
        35                   40                  45            
Tyr Gln Phe Arg Ser Arg Asn Phe Ser Leu Gln Lys Arg Arg Gly Ala 
    50                   55                  60                
Ser Ser Pro Gly Phe Val Leu Cys Phe Pro Ser Leu Leu Leu Arg Ser 
65                   70                  75                  80
Asp Ser Pro Ser Pro Gly Leu Glu Arg Ala Thr Glu His Trp Pro Pro 
                85                   90                  95    
Ser Ala Ser Ala Lys Cys Ser Pro Pro Gln Pro Gly Asp Ala Pro Thr 
            100                  105                110        
Ser Pro Gly Ala Val Arg Ser Ala Ser Ala Ser Gly Gln Leu Arg Glu 
        115                  120                125            
Glu Glu Pro Gln Gln Pro Arg Leu Leu Ser Phe Pro Gly His Pro Pro 
    130                  135                140                
Pro Ala Pro Gly Ser Arg Met Asn Leu Leu Asp Pro Phe Met Lys Met 
145                  150                155                  160
Thr Asp Glu Gln Glu Lys Gly Leu Ser Gly Ala Pro Ser Pro Thr Met 
                165                  170                175    
Ser Glu Asp Ser Ala Gly Ser Pro Cys Pro Ser Gly Ser Gly Ser Asp 
            180                  185                190        
Thr Glu Asn Thr Arg Pro Gln Glu Asn Thr Phe Pro Lys Gly Glu Pro 
        195                  200                205            
Asp Leu Lys Lys Glu Ser Glu Glu Asp Lys Phe Pro Val Cys Ile Arg 
    210                  215                220                
Glu Ala Val Ser Gln Val Leu Lys Gly Tyr Asp Trp Thr Leu Val Pro 
225                  230                235                  240
Met Pro Val Arg Val Asn Gly Ser Ser Lys Asn Lys Pro His Val Lys 
                245                  250                255    
Arg Pro Met Asn Ala Phe Met Val Trp Ala Gln Ala Ala Arg Arg Lys 
            260                  265                270        
Leu Ala Asp Gln Tyr Pro His Leu His Asn Ala Glu Leu Ser Lys Thr 
        275                  280                285            
Leu Gly Lys Leu Trp Arg 
    290                

<210> 89
<211> 2355
<212> DNA
<213> Rattus norvegicus

<220> 
<221> source
<222> 1..2355
<223> /mol_type="DNA"
      /note="Rattus norvegicus c-Myc"
      /organism="Rattus norvegicus"

<400> 89
acccccgggc tgcgctgctc tccgctgccg cctccgccgc gcccactccg ctcgcctcct      60

gcctccaaaa gggcagggct tcgccgaggc ttggcgggaa aaagaagcga ggggagggat     120

ccggagtcgc agtataaaag aagcttttcg ggcgtttttt ttctgactcg ctgtagtaat     180

tccagcgaga gacagaggga gtgagcgggc gggttggaag agcccagtgt gcagagcccc     240

actccgggct tcctaggaag gcagctctgg agtgagaagg gctttgcctc caggcttgct     300

gcctcctcga cccaatcctc ccgctgaccc aacatcagcg gtcgcaaccc tcgccgcctc     360

tgggaaactt tgcccattgc aacgggcaga cacttctcac tggaacttac aatctgcgag     420

ccaggacagg actccccagg cgcaggggag ggaatttttg tctatttggg gacagtgttc     480

tctgcctctg cccgcgatcg gctcccctga aaagagctcc tcgcgttatt tgaagcctga     540

atttcctttg ggaggtggaa aacccgacag tcacgacgat gcccctcaac gtgagcttcg     600

ctaacaggaa ctatgacctc gactacgact cggtgcagcc ctatttcatc tgcgacgagg     660

aagagaattt ctatcaccag caacagcaga gcgagctgca gccgcccgca cccagtgagg     720

atatctggaa gaaattcgag ctgctgccca ccccgcccct gtcccccagc cgccgctccg     780

ggctctgctc tccgtcctat gttgcggtcg ctacgtcctt ctccccaagg gaggacgatg     840

acggtggcgg tggcaacttc tccaccgccg atcagctgga gatgatgacc gagctacttg     900

gaggagacat ggtgaatcag agcttcatct gcgatcctga cgatgagacc ttcatcaaga     960

acatcatcat ccaggactgt atgtggagcg gcttctcggc cgctgccaaa ctggtctccg    1020

agaagctggc ctcttaccag gctgcgcgca aagacagcac cagcctgagc cccgcccgcg    1080

ggcacagcgt ctgctccacc tccagcctgt acctgcagga cctcaccgcc gcagcgtccg    1140

agtgcatcga cccctcagtg gtcttcccct acccgctcaa cgacagcagc tcgcccaaat    1200

cctgtacctc gtccgattcc acggccttct cttcttcctc ggactcgctg ctgtcctccg    1260

agtcctcccc acgggccacc cctgagcccc tagtgctgca tgaagagaca ccgcccacca    1320

ccagcagcga ctctgaagaa gaacaagatg atgaggaaga aattgatgtg gtgtctgtgg    1380

aaaagaggca accccctgcc aagaggtccg agtcagggtc atccccatca agaggccaca    1440

gcaaacctcc acacagccca ctggtcctca agaggtgcca tgtctctact caccagcaca    1500

attatgcagc acccccctcc acaaggaagg actatccagc tgccaagagg gccaagttgg    1560

acagtggcag ggtcctgaaa cagatcagca acaaccgcaa atgctccagc cccaggtcct    1620

cagacaccga ggaaaacgac aagaggcgga cacacaacgt cttggaacgt cagaggagaa    1680

acgagctgaa gcgtagcttt tttgccctgc gcgaccagat ccctgagttg gaaaacaacg    1740

aaaaggcccc caaggtagtt atcctcaaaa aagccaccgc ctacatcctg tccgttcaag    1800

cagatgagca caaactcatc tcagaaaagg acttactgag gaaacggcga gaacagttga    1860

aacacaaact cgaacagctt cgaaactctg gtgcataaac tgaccggaag tgaggaggag    1920

ctggaatctc gagtgtaagg agaacggttc cttctgacag aacttggact tcaaaaaatg    1980

catgctcaaa gcctaacctc acaaccttgg ctggggcttt gggacttcag ccataatgtt    2040

aactgcctca aagttaaggc ataaaagaac ttttttttat gcttcccatc ttctttcttt    2100

ttcctttaac agatttgtat ttaattgttt tttttaaaaa aatcttccgg tgtacatagg    2160

gcctttaaat gtaaataact ttaataaaac gtttataaca gttatacaag attttaagac    2220

atgtatgata aaccataatt ttttttattt aaagaccttt tcatttttaa agttgatttt    2280

tttctattgt ttttagaaaa aataaaataa ttggaaaaaa tataattgag ccaactctta    2340

aaaaaaaaaa aaaaa                                                     2355


<210> 90
<211> 453
<212> PRT
<213> Rattus norvegicus

<220> 
<221> SOURCE
<222> 1..453
<223> /mol_type="protein"
      /note="Rattus norvegicus c-Myc"
      /organism="Rattus norvegicus"

<400> 90
Met Asn Phe Leu Trp Glu Val Glu Asn Pro Thr Val Thr Thr Met Pro 
1               5                   10                   15    
Leu Asn Val Ser Phe Ala Asn Arg Asn Tyr Asp Leu Asp Tyr Asp Ser 
            20                   25                  30        
Val Gln Pro Tyr Phe Ile Cys Asp Glu Glu Glu Asn Phe Tyr His Gln 
        35                   40                  45            
Gln Gln Gln Ser Glu Leu Gln Pro Pro Ala Pro Ser Glu Asp Ile Trp 
    50                   55                  60                
Lys Lys Phe Glu Leu Leu Pro Thr Pro Pro Leu Ser Pro Ser Arg Arg 
65                   70                  75                  80
Ser Gly Leu Cys Ser Pro Ser Tyr Val Ala Val Ala Thr Ser Phe Ser 
                85                   90                  95    
Pro Arg Glu Asp Asp Asp Gly Gly Gly Gly Asn Phe Ser Thr Ala Asp 
            100                  105                110        
Gln Leu Glu Met Met Thr Glu Leu Leu Gly Gly Asp Met Val Asn Gln 
        115                  120                125            
Ser Phe Ile Cys Asp Pro Asp Asp Glu Thr Phe Ile Lys Asn Ile Ile 
    130                  135                140                
Ile Gln Asp Cys Met Trp Ser Gly Phe Ser Ala Ala Ala Lys Leu Val 
145                  150                155                  160
Ser Glu Lys Leu Ala Ser Tyr Gln Ala Ala Arg Lys Asp Ser Thr Ser 
                165                  170                175    
Leu Ser Pro Ala Arg Gly His Ser Val Cys Ser Thr Ser Ser Leu Tyr 
            180                  185                190        
Leu Gln Asp Leu Thr Ala Ala Ala Ser Glu Cys Ile Asp Pro Ser Val 
        195                  200                205            
Val Phe Pro Tyr Pro Leu Asn Asp Ser Ser Ser Pro Lys Ser Cys Thr 
    210                  215                220                
Ser Ser Asp Ser Thr Ala Phe Ser Ser Ser Ser Asp Ser Leu Leu Ser 
225                  230                235                  240
Ser Glu Ser Ser Pro Arg Ala Thr Pro Glu Pro Leu Val Leu His Glu 
                245                  250                255    
Glu Thr Pro Pro Thr Thr Ser Ser Asp Ser Glu Glu Glu Gln Asp Asp 
            260                  265                270        
Glu Glu Glu Ile Asp Val Val Ser Val Glu Lys Arg Gln Pro Pro Ala 
        275                  280                285            
Lys Arg Ser Glu Ser Gly Ser Ser Pro Ser Arg Gly His Ser Lys Pro 
    290                  295                300                
Pro His Ser Pro Leu Val Leu Lys Arg Cys His Val Ser Thr His Gln 
305                  310                315                  320
His Asn Tyr Ala Ala Pro Pro Ser Thr Arg Lys Asp Tyr Pro Ala Ala 
                325                  330                335    
Lys Arg Ala Lys Leu Asp Ser Gly Arg Val Leu Lys Gln Ile Ser Asn 
            340                  345                350        
Asn Arg Lys Cys Ser Ser Pro Arg Ser Ser Asp Thr Glu Glu Asn Asp 
        355                  360                365            
Lys Arg Arg Thr His Asn Val Leu Glu Arg Gln Arg Arg Asn Glu Leu 
    370                  375                380                
Lys Arg Ser Phe Phe Ala Leu Arg Asp Gln Ile Pro Glu Leu Glu Asn 
385                  390                395                  400
Asn Glu Lys Ala Pro Lys Val Val Ile Leu Lys Lys Ala Thr Ala Tyr 
                405                  410                415    
Ile Leu Ser Val Gln Ala Asp Glu His Lys Leu Ile Ser Glu Lys Asp 
            420                  425                430        
Leu Leu Arg Lys Arg Arg Glu Gln Leu Lys His Lys Leu Glu Gln Leu 
        435                  440                445            
Arg Asn Ser Gly Ala 
    450            

<210> 91
<211> 2393
<212> DNA
<213> Rattus norvegicus

<220> 
<221> source
<222> 1..2393
<223> /mol_type="DNA"
      /note="Rattus norvegicus Klf-4"
      /organism="Rattus norvegicus"

<400> 91
atcttcgttg acttcggggt ttgggtaccc ctctctcttc ttcggactcc ggaggacctt      60

ctgggccccc acattaatga ggcagccacc tggcgagtct gacatggctg tcagcgacgc     120

tctgctcccg tccttctcca cgttcgcgtc cggcccggcg ggaagggaga agacactgcg     180

tccagcaggt gccccgacta accgttggcg agaggaactc tctcacatga agcgacttcc     240

cccacttccc ggccgcccct acgacctggc ggcgacggtg gccacagacc tggaaagtgg     300

tggagctggt gcagcttgca gcagtaacaa cccggcccta ccccggaggg agaccgagga     360

gttcaacgat ctcctggacc tagactttat cctttccaac tcgctatccc accaggaatc     420

ggtggccgcc accgtgacca cctcggcgtc agcttcatcc tcgtcttccc cagctagcag     480

cggccctgcc agcgcgccct ccacctgcag cttcagctat ccgatccggg ccgggggtga     540

cccgggcgtg gctgcgggca acacaggtgg agggctcctc tacagccgag aatctgcgcc     600

acctcccacg gcccccttca acctggcgga catcaatgac gtgagcccct cgggcggctt     660

cgtggctgag ctcctgcggc cggagttgga cccagtatac attccgccac agcagcctca     720

gccgccaggt ggcgggctga tgggcaagtt tgtgctgaag gcgtctctga gcacccctgg     780

cagcgagtac accagccctt cggtcatcag tgttagcaaa ggaagcccag acggcagcca     840

ccctgtggta gtggcgccct acagcggtgg cccgccgcgt atgtgcccca agattaagca     900

agaggccgtc ccgtcctgca cggtcagccg gtccctagag gcccacttga gcgctggacc     960

ccagctcagc aacggccaca ggcccaacac acacgacttc cccctggggc ggcagctccc    1020

caccaggact acccctacac tgagtcccga ggaactgctg aacagcaggg actgtcaccc    1080

tggcctgcct cttcccccag gattccatcc ccatccgggg cccagctacc ctcctttcct    1140

gccagaccag atgcagtcgc aagtcccctc tctccattat caagagctca tgccaccggg    1200

atcctgcctg ccagaggagc ccaagccaaa gaggggaaga aggtcttggc cccggaaaag    1260

aacagccacc cacacttgtg actatgcagg ctgtggcaaa acctatacga agagttctca    1320

tctcaaggca cacctgcgaa ctcacacagg cgagaaacct taccactgtg actgggacgg    1380

ctgtgggtgg aaattcgccc gctcagatga actgaccagg cactaccgca aacacaccgg    1440

gcaccggccc tttcagtgcc agaagtgcga cagggccttt tccaggtcgg accaccttgc    1500

cttacacatg aagaggcact tttaaattcc acatcgtgga catgacccac actgccagga    1560

gagagttcag tatttttttt taacctttca cactgtcttc ccacgagggg aggagcccag    1620

ctggcaagcg ctacaatcat ggtcaagttc ccagcaagtc agcttgtgaa tggataatca    1680

ggagaaagga agagtccaag ggacaaaaga aaagaaaaga aaaaaatact aaaaaacaaa    1740

caaacaaaaa aaaaaaacaa aagaaaaaaa tcacagaaca gatggggtct gagactggat    1800

cttctatcat tccaatacca aatccgactt gaacaagact ggacttacaa aatgccaagg    1860

ggtgactgga agtttgtgga tatcagggta tacattaaat cagtgacctg gggggaggga    1920

agaccagagt tcccttgaat tgtgcttcaa tgatgcaata tacatggaaa gaccaccttg    1980

tatgctcttt gccttctaaa aagccattat gacgtcagag gaagaggaag caattcaggt    2040

acagaacgtg ttctaatagc ctaaacgatg gtgcttggtg agtcgtggtt ctaaaggtac    2100

caaacggggg agccaaagtt ctccaactgc tgcatacttt gacaaggaaa atctattttt    2160

gtcttccgat ctacatttat gacctaagtc aggtaaataa gcctggttta tttctgtaac    2220

attttttatg cagacagtct gttatgcact gtggtttcag atgtgcaata atttgtacaa    2280

tggtttattc ccaagtatgc ctttaagcag aacaaatgtg tttttctata tagttccttg    2340

ccttaataaa tatgtaatat aaatttaaaa aaaaaaaaaa aaaaaaaaaa aaa           2393


<210> 92
<211> 482
<212> PRT
<213> Rattus norvegicus

<220> 
<221> SOURCE
<222> 1..482
<223> /mol_type="protein"
      /note="Rattus norvegicus Klf-4"
      /organism="Rattus norvegicus"

<400> 92
Met Arg Gln Pro Pro Gly Glu Ser Asp Met Ala Val Ser Asp Ala Leu 
1               5                   10                   15    
Leu Pro Ser Phe Ser Thr Phe Ala Ser Gly Pro Ala Gly Arg Glu Lys 
            20                   25                  30        
Thr Leu Arg Pro Ala Gly Ala Pro Thr Asn Arg Trp Arg Glu Glu Leu 
        35                   40                  45            
Ser His Met Lys Arg Leu Pro Pro Leu Pro Gly Arg Pro Tyr Asp Leu 
    50                   55                  60                
Ala Ala Thr Val Ala Thr Asp Leu Glu Ser Gly Gly Ala Gly Ala Ala 
65                   70                  75                  80
Cys Ser Ser Asn Asn Pro Ala Leu Pro Arg Arg Glu Thr Glu Glu Phe 
                85                   90                  95    
Asn Asp Leu Leu Asp Leu Asp Phe Ile Leu Ser Asn Ser Leu Ser His 
            100                  105                110        
Gln Glu Ser Val Ala Ala Thr Val Thr Thr Ser Ala Ser Ala Ser Ser 
        115                  120                125            
Ser Ser Ser Pro Ala Ser Ser Gly Pro Ala Ser Ala Pro Ser Thr Cys 
    130                  135                140                
Ser Phe Ser Tyr Pro Ile Arg Ala Gly Gly Asp Pro Gly Val Ala Ala 
145                  150                155                  160
Gly Asn Thr Gly Gly Gly Leu Leu Tyr Ser Arg Glu Ser Ala Pro Pro 
                165                  170                175    
Pro Thr Ala Pro Phe Asn Leu Ala Asp Ile Asn Asp Val Ser Pro Ser 
            180                  185                190        
Gly Gly Phe Val Ala Glu Leu Leu Arg Pro Glu Leu Asp Pro Val Tyr 
        195                  200                205            
Ile Pro Pro Gln Gln Pro Gln Pro Pro Gly Gly Gly Leu Met Gly Lys 
    210                  215                220                
Phe Val Leu Lys Ala Ser Leu Ser Thr Pro Gly Ser Glu Tyr Thr Ser 
225                  230                235                  240
Pro Ser Val Ile Ser Val Ser Lys Gly Ser Pro Asp Gly Ser His Pro 
                245                  250                255    
Val Val Val Ala Pro Tyr Ser Gly Gly Pro Pro Arg Met Cys Pro Lys 
            260                  265                270        
Ile Lys Gln Glu Ala Val Pro Ser Cys Thr Val Ser Arg Ser Leu Glu 
        275                  280                285            
Ala His Leu Ser Ala Gly Pro Gln Leu Ser Asn Gly His Arg Pro Asn 
    290                  295                300                
Thr His Asp Phe Pro Leu Gly Arg Gln Leu Pro Thr Arg Thr Thr Pro 
305                  310                315                  320
Thr Leu Ser Pro Glu Glu Leu Leu Asn Ser Arg Asp Cys His Pro Gly 
                325                  330                335    
Leu Pro Leu Pro Pro Gly Phe His Pro His Pro Gly Pro Ser Tyr Pro 
            340                  345                350        
Pro Phe Leu Pro Asp Gln Met Gln Ser Gln Val Pro Ser Leu His Tyr 
        355                  360                365            
Gln Glu Leu Met Pro Pro Gly Ser Cys Leu Pro Glu Glu Pro Lys Pro 
    370                  375                380                
Lys Arg Gly Arg Arg Ser Trp Pro Arg Lys Arg Thr Ala Thr His Thr 
385                  390                395                  400
Cys Asp Tyr Ala Gly Cys Gly Lys Thr Tyr Thr Lys Ser Ser His Leu 
                405                  410                415    
Lys Ala His Leu Arg Thr His Thr Gly Glu Lys Pro Tyr His Cys Asp 
            420                  425                430        
Trp Asp Gly Cys Gly Trp Lys Phe Ala Arg Ser Asp Glu Leu Thr Arg 
        435                  440                445            
His Tyr Arg Lys His Thr Gly His Arg Pro Phe Gln Cys Gln Lys Cys 
    450                  455                460                
Asp Arg Ala Phe Ser Arg Ser Asp His Leu Ala Leu His Met Lys Arg 
465                  470                475                  480
His Phe 
        

<210> 93
<211> 2323
<212> DNA
<213> Rattus norvegicus

<220> 
<221> source
<222> 1..2323
<223> /mol_type="DNA"
      /note="Rattus norvegicus Sox-2"
      /organism="Rattus norvegicus"

<400> 93
gtgtttgcaa aaagggaaaa gtactttgct gcctctttaa gactagggct gggagaaaga      60

agaggagaga aaaagaaagg agagaagttt ggagcccgag gcttaagcct ttccaaaaac     120

taatcacaac aatcgcggcg gcccgaggag gagagcgact gttttttcat cccaattgca     180

cttcgcccgt ctcgagctcc gcttcccccc aactattctc cgccagatct ccgcgcaagg     240

ccgtgcacgc cgacgacccc gcccgcggcc cctgcatccc ggcccccgcg cgcggccccc     300

gcagtcccgg ccgggccgag ggtcggcggc cgccggcggg ccgcgcccgc gcccagcgcc     360

cgcatgtata acatgatgga gacggagctg aagccgccgg gccctcagca agcttcgggg     420

ggcggcggcg gaggaggcaa cgccacggcg gcggcgaccg gcggcaacca gaagaacagc     480

ccggaccgcg tcaagaggcc catgaatgcc ttcatggtgt ggtcccgggg gcagcggcgt     540

aagatggccc aggagaaccc caagatgcac aactcggaga tcagcaagcg cctgggcgcc     600

gagtggaaac ttttgtcgga gaccgagaag cggccgttca tcgacgaggc caagcggctg     660

cgcgctctgc acatgaagga gcacccggat tataaatacc ggccgcggcg gaaaaccaag     720

acgctcatga agaaggataa gtacacgctt cccggaggct tgctggcccc cggcgggaac     780

agcatggcga gcggggttgg ggtgggcgcc ggcctgggtg cgggcgtgaa ccagcgcatg     840

gacagctacg cgcacatgaa cggctggagc aacggcagct acagcatgat gcaggagcag     900

ctgggctacc cgcagcaccc gggcctcaac gctcacggcg cggcacagat gcagccgatg     960

caccgctacg acgtcagcgc cctgcagtac aactccatga ccagctcgca gacctacatg    1020

aacggctcgc ccacctacag catgtcctac tcgcagcagg gcacccccgg tatggcgctg    1080

ggctccatgg gctctgtggt caagtccgag gccagttcca gcccccccgt ggttacctct    1140

tcctcccact ccagggcgcc ctgccaggcc ggggacctcc gggacatgat cagcatgtac    1200

ctccccggcg ccgaggtgcc ggagcccgct gcgcccagta gactgcacat ggcccagcac    1260

taccagagcg gcccggtgcc cggcacggcc attaacggca cactgcccct gtcgcacatg    1320

tgagggccgg accgcgaact ggagaagggg agagattttt caaaaagata caagggaatt    1380

gggaggggtg caaaagagga gagtaagaaa aatctgaatg ctcaaaagga aaaaaaaaat    1440

ctcattaccc gcagcaaaat gacagctgcg gaaaaaaacc accaatccca tccaaattaa    1500

cgcaaaaacc gtgatgccga ctagaaaact tttatgagag atctggagga aaaaaactac    1560

gcaaaacttt tttttaaagt tctagtggta cgttaggcgc ttcgcaggga gttctcaaaa    1620

gtctttacca gtaatattta gaactagact ccgggcgatg aaaaaagttt taatatttgc    1680

aagcaacttt tgtacagtat ttatcgagat aaacatggca atcaaatgtc cattgtttat    1740

aagctgagaa tttgccaata tttttcgagg aaagggttct tgctgggttt tgattctgca    1800

gcttaaatta aggaccgtta cagacaagga aggaatttat tcggatttga acgttttagt    1860

tttaaaattg tacaaaagga aaacatgaga gcaagtactg gcaagaccat tttcgtggtc    1920

ttgtttaggg caaacgttct agattgtact aaatttttaa cttactgtta aaggcaaaaa    1980

aaaaatgtcc atgcaggttg atatcgttgg taatttataa tagcttttgt tcaatcccac    2040

ccttttcatt ttgttcacat aaaaatatgg aaattactgt gtttgaaata ttttcttatg    2100

gtttgtaata tttctgtaaa ttgtgatatt ttaaggtttt ttcccccttt tattttccgt    2160

agttgtattt taaaagattc ggctgttatt ggaaccaggc tgccgagaat ccatgtatat    2220

atttgaacta ataccatcct tataacagtt acgtttccaa cttaagtttt tactccatta    2280

tgcacagttt gagataaata aatttttgaa atatggacac tga                      2323


<210> 94
<211> 319
<212> PRT
<213> Rattus norvegicus

<220> 
<221> SOURCE
<222> 1..319
<223> /mol_type="protein"
      /note="Rattus norvegicus Sox-2"
      /organism="Rattus norvegicus"

<400> 94
Met Tyr Asn Met Met Glu Thr Glu Leu Lys Pro Pro Gly Pro Gln Gln 
1               5                   10                   15    
Ala Ser Gly Gly Gly Gly Gly Gly Gly Asn Ala Thr Ala Ala Ala Thr 
            20                   25                  30        
Gly Gly Asn Gln Lys Asn Ser Pro Asp Arg Val Lys Arg Pro Met Asn 
        35                   40                  45            
Ala Phe Met Val Trp Ser Arg Gly Gln Arg Arg Lys Met Ala Gln Glu 
    50                   55                  60                
Asn Pro Lys Met His Asn Ser Glu Ile Ser Lys Arg Leu Gly Ala Glu 
65                   70                  75                  80
Trp Lys Leu Leu Ser Glu Thr Glu Lys Arg Pro Phe Ile Asp Glu Ala 
                85                   90                  95    
Lys Arg Leu Arg Ala Leu His Met Lys Glu His Pro Asp Tyr Lys Tyr 
            100                  105                110        
Arg Pro Arg Arg Lys Thr Lys Thr Leu Met Lys Lys Asp Lys Tyr Thr 
        115                  120                125            
Leu Pro Gly Gly Leu Leu Ala Pro Gly Gly Asn Ser Met Ala Ser Gly 
    130                  135                140                
Val Gly Val Gly Ala Gly Leu Gly Ala Gly Val Asn Gln Arg Met Asp 
145                  150                155                  160
Ser Tyr Ala His Met Asn Gly Trp Ser Asn Gly Ser Tyr Ser Met Met 
                165                  170                175    
Gln Glu Gln Leu Gly Tyr Pro Gln His Pro Gly Leu Asn Ala His Gly 
            180                  185                190        
Ala Ala Gln Met Gln Pro Met His Arg Tyr Asp Val Ser Ala Leu Gln 
        195                  200                205            
Tyr Asn Ser Met Thr Ser Ser Gln Thr Tyr Met Asn Gly Ser Pro Thr 
    210                  215                220                
Tyr Ser Met Ser Tyr Ser Gln Gln Gly Thr Pro Gly Met Ala Leu Gly 
225                  230                235                  240
Ser Met Gly Ser Val Val Lys Ser Glu Ala Ser Ser Ser Pro Pro Val 
                245                  250                255    
Val Thr Ser Ser Ser His Ser Arg Ala Pro Cys Gln Ala Gly Asp Leu 
            260                  265                270        
Arg Asp Met Ile Ser Met Tyr Leu Pro Gly Ala Glu Val Pro Glu Pro 
        275                  280                285            
Ala Ala Pro Ser Arg Leu His Met Ala Gln His Tyr Gln Ser Gly Pro 
    290                  295                300                
Val Pro Gly Thr Ala Ile Asn Gly Thr Leu Pro Leu Ser His Met 
305                  310                315                

<210> 95
<211> 2358
<212> DNA
<213> Rattus norvegicus

<220> 
<221> source
<222> 1..2358
<223> /mol_type="DNA"
      /note="Rattus norvegicus NANOG"
      /organism="Rattus norvegicus"

<400> 95
tcagataggc tgatttcgag tctttctctt ttgtgggaag accgaggctc gcttcttttt      60

ggcttgttga ctcttttaca tctggacatt taactcttac ttttaagatc tttccctcta     120

gacactgagt tttaaagtct taactttttg gttgttaaaa actttttttt ttttaaagtc     180

ccttcccttg ccgttgggct gacatgagcg tggatctttc tggtccccac agtctgccta     240

gttgtgagga agcatcgaac tctggggatt cctcgccgat gcctgccgtt catcttcctg     300

aggaaaatta ttcttgctta caagtgtctg ctactgagat gctctgcaca gagactgcct     360

ctcctccgcc ttcctctggg gacctacctc ttcaagatag ccctgattct tctagcaatc     420

ccaagctaaa gctgtctggt cccgaggctg acgagggccc tgagaagaaa gaagagaaca     480

aggtcctcac caagaagcag aagatgcgga ctgtgttctc tcaggcccag ttgtgtgcac     540

tcaaggatag gtttcagagg caaaggtacc tcagcctcca gcagatgcaa gatctctcta     600

ccattctgaa cctgagctat aagcaggtga agacctggtt ccaaaaccaa agaatgaagt     660

gcaagaggtg gcagaaaaac caatggttga agactagcaa cggcctgact cagaagggct     720

cagcgccggt ggagtatccc agcatccatt gcagctattc tcagggctat ctgatgaacg     780

cgtctggaaa ccttccagta tggggcagtc agacctggac caacccaact tggaacaacc     840

agacctggac caacccaacc tggagcaacc agacctggac caacccaact tggagcaacc     900

aggcctggag cactcagtcc tggtgtactc aggcctggaa cagccagact tggaacgctg     960

ctccgctcca taacttcggg gaggactccc tgcagcctta tgtgccgttg cagcaaaact    1020

tctccgccag tgatttggag gcgaatttgg aagccactag ggaaagccag gcgcatttta    1080

gtaccccgca agccttggaa ttgttcctga actactccgt gaattctcca ggcgaaatat    1140

gaggtttaca caacaactgg gcttaaagtc agggcagggc cagggtcagc tttcttcctt    1200

cttccaaaga gttttatatt gttcttattt tttttttaat tattattttg tttttgtttt    1260

ttgtttatca aggtagggtt tctctgtgtg gttctggctg tcctggaatt cactctgtag    1320

accaggctgg cctcgtactc agagatctgc ctacttttgc ctcctgaagg ctagggctaa    1380

agattttcta aagattttca tagtttttat ttttttaatt attatctgtt ttcatgtttg    1440

tgtttttttg ttttgttttt gtttttgttt ttgtttatca agatagggtt tctctgtgtg    1500

gctctagtag tcccggaaac tggctctgta gaccaggctg tccttgaact cagaaatctg    1560

cctttgcctc cggactgcgg ggactaaagg cagtatataa ccacctggca cattgttttt    1620

atttttattc ttttggtgcc agaaagcaaa cctaggactt tgagctgggc acccactcaa    1680

ccactgagct ctgtttgcga cccccgtgtt ggctgcattt gtctgagctg ggtaacttgt    1740

ctttttttcc gtgttaacga tgggcttcgg agacagtgca ctatacactc tatcctcccc    1800

caggtctcac acacccaccc tactccatac caacccaggc ttgtctgtct tttttttttt    1860

tggagctgag gactgaaccc agggccttgc gctttctagg caagcgctct acctctgagc    1920

taaatcccca acccttgtct gtctttttag aagcttgggt cttggtgtgc actgtgtatc    1980

gttttgaggg gtgaggttta aaagtataca aattataaag attcatgcag atatggtggc    2040

tcctctcaag gacgagacag aaggatcacc agtttgaggc tatctcagat ataaaataag    2100

ttcaagacca gcctgtacta tgtctaaata gtaagacagc atctcaacaa aataataaaa    2160

ctaaggtaag gagataaaag taaagtctca acaaaataca agatctcgcc tgttacagtt    2220

ctttgatttc ctccgtgtct ttgcagttcc gccaagaggc ttctatgtta atatctgtag    2280

aaagatgttt atatttgact gtaccatgat aaaccagtgc cagctggact agtttaaata    2340

aaacactaat tttaccca                                                  2358


<210> 96
<211> 312
<212> PRT
<213> Rattus norvegicus

<220> 
<221> SOURCE
<222> 1..312
<223> /mol_type="protein"
      /note="Rattus norvegicus NANOG"
      /organism="Rattus norvegicus"

<400> 96
Met Ser Val Asp Leu Ser Gly Pro His Ser Leu Pro Ser Cys Glu Glu 
1               5                   10                   15    
Ala Ser Asn Ser Gly Asp Ser Ser Pro Met Pro Ala Val His Leu Pro 
            20                   25                  30        
Glu Glu Asn Tyr Ser Cys Leu Gln Val Ser Ala Thr Glu Met Leu Cys 
        35                   40                  45            
Thr Glu Thr Ala Ser Pro Pro Pro Ser Ser Gly Asp Leu Pro Leu Gln 
    50                   55                  60                
Asp Ser Pro Asp Ser Ser Ser Asn Pro Lys Leu Lys Leu Ser Gly Pro 
65                   70                  75                  80
Glu Ala Asp Glu Gly Pro Glu Lys Lys Glu Glu Asn Lys Val Leu Thr 
                85                   90                  95    
Lys Lys Gln Lys Met Arg Thr Val Phe Ser Gln Ala Gln Leu Cys Ala 
            100                  105                110        
Leu Lys Asp Arg Phe Gln Arg Gln Arg Tyr Leu Ser Leu Gln Gln Met 
        115                  120                125            
Gln Asp Leu Ser Thr Ile Leu Asn Leu Ser Tyr Lys Gln Val Lys Thr 
    130                  135                140                
Trp Phe Gln Asn Gln Arg Met Lys Cys Lys Arg Trp Gln Lys Asn Gln 
145                  150                155                  160
Trp Leu Lys Thr Ser Asn Gly Leu Thr Gln Lys Gly Ser Ala Pro Val 
                165                  170                175    
Glu Tyr Pro Ser Ile His Cys Ser Tyr Ser Gln Gly Tyr Leu Met Asn 
            180                  185                190        
Ala Ser Gly Asn Leu Pro Val Trp Gly Ser Gln Thr Trp Thr Asn Pro 
        195                  200                205            
Thr Trp Asn Asn Gln Thr Trp Thr Asn Pro Thr Trp Ser Asn Gln Thr 
    210                  215                220                
Trp Thr Asn Pro Thr Trp Ser Asn Gln Ala Trp Ser Thr Gln Ser Trp 
225                  230                235                  240
Cys Thr Gln Ala Trp Asn Ser Gln Thr Trp Asn Ala Ala Pro Leu His 
                245                  250                255    
Asn Phe Gly Glu Asp Ser Leu Gln Pro Tyr Val Pro Leu Gln Gln Asn 
            260                  265                270        
Phe Ser Ala Ser Asp Leu Glu Ala Asn Leu Glu Ala Thr Arg Glu Ser 
        275                  280                285            
Gln Ala His Phe Ser Thr Pro Gln Ala Leu Glu Leu Phe Leu Asn Tyr 
    290                  295                300                
Ser Val Asn Ser Pro Gly Glu Ile 
305                  310        

<210> 97
<211> 463
<212> DNA
<213> Rattus norvegicus

<220> 
<221> source
<222> 1..463
<223> /mol_type="DNA"
      /note="Rattus norvegicus Insulin"
      /organism="Rattus norvegicus"

<400> 97
aaccctaagt gaccagctac aatcatagac catcagcaag caggtcattg ttccaacatg      60

gccctgtgga tgcgcttcct gcccctgctg gccctgctcg tcctctggga gcccaagcct     120

gcccaggctt ttgtcaaaca gcacctttgt ggtcctcacc tggtggaggc tctgtacctg     180

gtgtgtgggg aacgtggttt cttctacaca cccaagtccc gtcgtgaagt ggaggacccg     240

caagtgccac aactggagct gggtggaggc ccggaggccg gggatcttca gaccttggca     300

ctggaggttg cccggcagaa gcgtggcatt gtggatcagt gctgcaccag catctgctcc     360

ctctaccaac tggagaacta ctgcaactga gtccaccact ccccgcccac ccctctgcaa     420

tgaataaagc ctttgaatga gcaccaaaaa aaaaaaaaaa aaa                       463


<210> 98
<211> 110
<212> PRT
<213> Rattus norvegicus

<220> 
<221> SOURCE
<222> 1..110
<223> /mol_type="protein"
      /note="Rattus norvegicus Insulin"
      /organism="Rattus norvegicus"

<400> 98
Met Ala Leu Trp Met Arg Phe Leu Pro Leu Leu Ala Leu Leu Val Leu 
1               5                   10                   15    
Trp Glu Pro Lys Pro Ala Gln Ala Phe Val Lys Gln His Leu Cys Gly 
            20                   25                  30        
Pro His Leu Val Glu Ala Leu Tyr Leu Val Cys Gly Glu Arg Gly Phe 
        35                   40                  45            
Phe Tyr Thr Pro Lys Ser Arg Arg Glu Val Glu Asp Pro Gln Val Pro 
    50                   55                  60                
Gln Leu Glu Leu Gly Gly Gly Pro Glu Ala Gly Asp Leu Gln Thr Leu 
65                   70                  75                  80
Ala Leu Glu Val Ala Arg Gln Lys Arg Gly Ile Val Asp Gln Cys Cys 
                85                   90                  95    
Thr Ser Ile Cys Ser Leu Tyr Gln Leu Glu Asn Tyr Cys Asn 
            100                  105                110

<210> 99
<211> 1307
<212> DNA
<213> Rattus norvegicus

<220> 
<221> source
<222> 1..1307
<223> /mol_type="DNA"
      /note="Rattus norvegicus GAPDH"
      /organism="Rattus norvegicus"

<400> 99
gggggctctc tgctcctccc tgttctagag acagccgcat cttcttgtgc agtgccagcc      60

tcgtctcata gacaagatgg tgaaggtcgg tgtgaacgga tttggccgta tcggacgcct     120

ggttaccagg gctgccttct cttgtgacaa agtggacatt gttgccatca acgacccctt     180

cattgacctc aactacatgg tctacatgtt ccagtatgac tctacccacg gcaagttcaa     240

cggcacagtc aaggctgaga atgggaagct ggtcatcaac gggaaaccca tcaccatctt     300

ccaggagcga gatcccgcta acatcaaatg gggtgatgct ggtgctgagt atgtcgtgga     360

gtctactggc gtcttcacca ccatggagaa ggctggggct cacctgaagg gtggggccaa     420

aagggtcatc atctccgccc cttccgctga tgcccccatg tttgtgatgg gtgtgaacca     480

cgagaaatat gacaactccc tcaagattgt cagcaatgca tcctgcacca ccaactgctt     540

agcccccctg gccaaggtca tccatgacaa ctttggcatc gtggaagggc tcatgaccac     600

agtccatgcc atcactgcca ctcagaagac tgtggatggc ccctctggaa agctgtggcg     660

tgatggccgt ggggcagccc agaacatcat ccctgcatcc actggtgctg ccaaggctgt     720

gggcaaggtc atcccagagc tgaacgggaa gctcactggc atggccttcc gtgttcctac     780

ccccaatgta tccgttgtgg atctgacatg ccgcctggag aaacctgcca agtatgatga     840

catcaagaag gtggtgaagc aggcggccga gggcccacta aagggcatcc tgggctacac     900

tgaggaccag gttgtctcct gtgacttcaa cagcaactcc cattcttcca cctttgatgc     960

tggggctggc attgctctca atgacaactt tgtgaagctc atttcctggt atgacaatga    1020

atatggctac agcaacaggg tggtggacct catggcctac atggcctcca aggagtaaga    1080

aaccctggac cacccagccc agcaaggata ctgagagcaa gagagaggcc ctcagttgct    1140

gaggagtccc catcccaact cagcccccaa cactgagcat ctccctcaca attccatccc    1200

agaccccata acaacaggag gggcctgggg agccctccct tctctcgaat accatcaata    1260

aagttcgctg caccctcaaa aaaaaaaaaa aaaaaaaaaa aaaaaaa                  1307


<210> 100
<211> 323
<212> PRT
<213> Rattus norvegicus

<220> 
<221> SOURCE
<222> 1..323
<223> /mol_type="protein"
      /note="Rattus norvegicus GAPDH"
      /organism="Rattus norvegicus"

<400> 100
Met Val Lys Val Gly Val Asn Gly Phe Gly Arg Ile Gly Arg Leu Val 
1               5                   10                   15    
Thr Arg Ala Ala Phe Ser Cys Asp Lys Val Asp Ile Val Ala Ile Asn 
            20                   25                  30        
Asp Pro Phe Ile Asp Leu Asn Tyr Met Val Tyr Met Phe Gln Tyr Asp 
        35                   40                  45            
Ser Thr His Gly Lys Phe Asn Gly Thr Val Lys Ala Glu Asn Gly Lys 
    50                   55                  60                
Leu Val Ile Asn Gly Lys Pro Ile Thr Ile Phe Gln Glu Arg Asp Pro 
65                   70                  75                  80
Ala Asn Ile Lys Trp Gly Asp Ala Gly Ala Glu Tyr Val Val Glu Ser 
                85                   90                  95    
Thr Gly Val Phe Thr Thr Met Glu Lys Ala Gly Ala His Leu Lys Gly 
            100                  105                110        
Gly Ala Lys Arg Val Ile Ile Ser Ala Pro Ser Ala Asp Ala Pro Met 
        115                  120                125            
Phe Val Met Gly Val Asn His Glu Lys Tyr Asp Asn Ser Leu Lys Ile 
    130                  135                140                
Val Ser Asn Ala Ser Cys Thr Thr Asn Cys Leu Ala Pro Leu Ala Lys 
145                  150                155                  160
Val Ile His Asp Asn Phe Gly Ile Val Glu Gly Leu Met Thr Thr Val 
                165                  170                175    
His Ala Ile Thr Ala Thr Gln Lys Thr Val Asp Gly Pro Ser Gly Lys 
            180                  185                190        
Leu Trp Arg Asp Gly Arg Gly Ala Ala Gln Asn Ile Ile Pro Ala Ser 
        195                  200                205            
Thr Gly Ala Ala Lys Ala Val Gly Lys Val Ile Pro Glu Leu Asn Gly 
    210                  215                220                
Lys Leu Thr Gly Met Ala Phe Arg Val Pro Thr Pro Asn Val Ser Val 
225                  230                235                  240
Val Asp Leu Thr Cys Arg Leu Glu Lys Pro Ala Lys Tyr Asp Asp Ile 
                245                  250                255    
Lys Lys Val Val Lys Gln Ala Ala Glu Gly Pro Leu Lys Gly Ile Leu 
            260                  265                270        
Gly Tyr Thr Glu Asp Gln Val Val Ser Cys Asp Phe Asn Ser Asn Ser 
        275                  280                285            
His Ser Ser Thr Phe Asp Ala Gly Ala Gly Ile Ala Leu Asn Asp Asn 
    290                  295                300                
Phe Val Lys Leu Ile Ser Trp Tyr Asp Asn Glu Tyr Gly Tyr Ser Asn 
305                  310                315                  320
Arg Val Val 
            

<210> 101
<211> 1575
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..1575
<223> /mol_type="DNA"
      /note="Homo sapiens Glut-2 (SLC2A2)"
      /organism="Homo sapiens"

<400> 101
atgacagaag ataaggtcac tgggaccctg gttttcactg tcatcactgc tgtgctgggt      60

tccttccagt ttggatatga cattggtgtg atcaatgcac ctcaacaggt aataatatct     120

cactatagac atgttttggg tgttccactg gatgaccgaa aagctatcaa caactatgtt     180

atcaacagta cagatgaact gcccacaatc tcatactcaa tgaacccaaa accaacccct     240

tgggctgagg aagagactgt ggcagctgct caactaatca ccatgctctg gtccctgtct     300

gtatccagct ttgcagttgg tggaatgact gcatcattct ttggtgggtg gcttggggac     360

acacttggaa gaatcaaagc catgttagta gcaaacattc tgtcattagt tggagctctc     420

ttgatggggt tttcaaaatt gggaccatct catatactta taattgctgg aagaagcata     480

tcaggactat attgtgggct aatttcaggc ctggttccta tgtatatcgg tgaaattgct     540

ccaaccgctc tcaggggagc acttggcact tttcatcagc tggccatcgt cacgggcatt     600

cttattagtc agattattgg tcttgaattt atcttgggca attatgatct gtggcacatc     660

ctgcttggcc tgtctggtgt gcgagccatc cttcagtctc tgctactctt tttctgtcca     720

gaaagcccca gataccttta catcaagtta gatgaggaag tcaaagcaaa acaaagcttg     780

aaaagactca gaggatatga tgatgtcacc aaagatatta atgaaatgag aaaagaaaga     840

gaagaagcat cgagtgagca gaaagtctct ataattcagc tcttcaccaa ttccagctac     900

cgacagccta ttctagtggc actgatgctg catgtggctc agcaattttc cggaatcaat     960

ggcatttttt actactcaac cagcattttt cagacggctg gtatcagcaa acctgtttat    1020

gcaaccattg gagttggcgc tgtaaacatg gttttcactg ctgtctctgt attccttgtg    1080

gagaaggcag ggcgacgttc tctctttcta attggaatga gtgggatgtt tgtttgtgcc    1140

atcttcatgt cagtgggact tgtgctgctg aataagttct cttggatgag ttatgtgagc    1200

atgatagcca tcttcctctt tgtcagcttc tttgaaattg ggccaggccc gatcccctgg    1260

ttcatggtgg ctgagttttt cagtcaagga ccacgtcctg ctgctttagc aatagctgca    1320

ttcagcaatt ggacctgcaa tttcattgta gctctgtgtt tccagtacat tgcggacttc    1380

tgtggacctt atgtgttttt cctctttgct ggagtgctcc tggcctttac cctgttcaca    1440

ttttttaaag ttccagaaac caaaggaaag tcttttgagg aaattgctgc agaattccaa    1500

aagaagagtg gctcagccca caggccaaaa gctgctgtag aaatgaaatt cctaggagct    1560

acagagactg tgtaa                                                     1575


<210> 102
<211> 524
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..524
<223> /mol_type="protein"
      /note="Homo sapiens Glut-2 (SLC2A2)"
      /organism="Homo sapiens"

<400> 102
Met Thr Glu Asp Lys Val Thr Gly Thr Leu Val Phe Thr Val Ile Thr 
1               5                   10                   15    
Ala Val Leu Gly Ser Phe Gln Phe Gly Tyr Asp Ile Gly Val Ile Asn 
            20                   25                  30        
Ala Pro Gln Gln Val Ile Ile Ser His Tyr Arg His Val Leu Gly Val 
        35                   40                  45            
Pro Leu Asp Asp Arg Lys Ala Ile Asn Asn Tyr Val Ile Asn Ser Thr 
    50                   55                  60                
Asp Glu Leu Pro Thr Ile Ser Tyr Ser Met Asn Pro Lys Pro Thr Pro 
65                   70                  75                  80
Trp Ala Glu Glu Glu Thr Val Ala Ala Ala Gln Leu Ile Thr Met Leu 
                85                   90                  95    
Trp Ser Leu Ser Val Ser Ser Phe Ala Val Gly Gly Met Thr Ala Ser 
            100                  105                110        
Phe Phe Gly Gly Trp Leu Gly Asp Thr Leu Gly Arg Ile Lys Ala Met 
        115                  120                125            
Leu Val Ala Asn Ile Leu Ser Leu Val Gly Ala Leu Leu Met Gly Phe 
    130                  135                140                
Ser Lys Leu Gly Pro Ser His Ile Leu Ile Ile Ala Gly Arg Ser Ile 
145                  150                155                  160
Ser Gly Leu Tyr Cys Gly Leu Ile Ser Gly Leu Val Pro Met Tyr Ile 
                165                  170                175    
Gly Glu Ile Ala Pro Thr Ala Leu Arg Gly Ala Leu Gly Thr Phe His 
            180                  185                190        
Gln Leu Ala Ile Val Thr Gly Ile Leu Ile Ser Gln Ile Ile Gly Leu 
        195                  200                205            
Glu Phe Ile Leu Gly Asn Tyr Asp Leu Trp His Ile Leu Leu Gly Leu 
    210                  215                220                
Ser Gly Val Arg Ala Ile Leu Gln Ser Leu Leu Leu Phe Phe Cys Pro 
225                  230                235                  240
Glu Ser Pro Arg Tyr Leu Tyr Ile Lys Leu Asp Glu Glu Val Lys Ala 
                245                  250                255    
Lys Gln Ser Leu Lys Arg Leu Arg Gly Tyr Asp Asp Val Thr Lys Asp 
            260                  265                270        
Ile Asn Glu Met Arg Lys Glu Arg Glu Glu Ala Ser Ser Glu Gln Lys 
        275                  280                285            
Val Ser Ile Ile Gln Leu Phe Thr Asn Ser Ser Tyr Arg Gln Pro Ile 
    290                  295                300                
Leu Val Ala Leu Met Leu His Val Ala Gln Gln Phe Ser Gly Ile Asn 
305                  310                315                  320
Gly Ile Phe Tyr Tyr Ser Thr Ser Ile Phe Gln Thr Ala Gly Ile Ser 
                325                  330                335    
Lys Pro Val Tyr Ala Thr Ile Gly Val Gly Ala Val Asn Met Val Phe 
            340                  345                350        
Thr Ala Val Ser Val Phe Leu Val Glu Lys Ala Gly Arg Arg Ser Leu 
        355                  360                365            
Phe Leu Ile Gly Met Ser Gly Met Phe Val Cys Ala Ile Phe Met Ser 
    370                  375                380                
Val Gly Leu Val Leu Leu Asn Lys Phe Ser Trp Met Ser Tyr Val Ser 
385                  390                395                  400
Met Ile Ala Ile Phe Leu Phe Val Ser Phe Phe Glu Ile Gly Pro Gly 
                405                  410                415    
Pro Ile Pro Trp Phe Met Val Ala Glu Phe Phe Ser Gln Gly Pro Arg 
            420                  425                430        
Pro Ala Ala Leu Ala Ile Ala Ala Phe Ser Asn Trp Thr Cys Asn Phe 
        435                  440                445            
Ile Val Ala Leu Cys Phe Gln Tyr Ile Ala Asp Phe Cys Gly Pro Tyr 
    450                  455                460                
Val Phe Phe Leu Phe Ala Gly Val Leu Leu Ala Phe Thr Leu Phe Thr 
465                  470                475                  480
Phe Phe Lys Val Pro Glu Thr Lys Gly Lys Ser Phe Glu Glu Ile Ala 
                485                  490                495    
Ala Glu Phe Gln Lys Lys Ser Gly Ser Ala His Arg Pro Lys Ala Ala 
            500                  505                510        
Val Glu Met Lys Phe Leu Gly Ala Thr Glu Thr Val 
        515                  520                

<210> 103
<211> 1569
<212> DNA
<213> Rattus norvegicus

<220> 
<221> source
<222> 1..1569
<223> /mol_type="DNA"
      /note="Rattus norvegicus Glut-2 (SLC2A2)"
      /organism="Rattus norvegicus"

<400> 103
atgtcagaag acaagatcac cggaaccttg gctttcactg tcttcactgc agtgctgggt      60

tccttccagt tcggatatga catcggtgtg atcaatgcac ctcaagaggt aataatatcc     120

cattatcgac atgttttggg tgttcctctg gatgaccgaa gagctaccat taactatgac     180

atcaatggca cagacacccc actcatagtc acaccagcac atacgacacc agacgcctgg     240

gaagaagaga ctgaaggatc tgctcacata gtcactatgc tctggtctct gtctgtgtcc     300

agctttgcag taggcggaat ggtcgcctcg ttctttggtg ggtggcttgg ggacaaactc     360

ggaaggatca aagccatgtt ggctgcaaac agcctctcgt tgactggagc cctcttgatg     420

gggtgttcca aatttggacc ggcacatgct ctcatcattg ctggaagaag cgtatcagga     480

ctgtactgtg ggctaatttc aggactggtt ccaatgtaca ttggcgagat tgctccaacc     540

acactcaggg gtgccctggg cactcttcac caactggctc ttgtcacagg cattcttatt     600

agtcagattg ctggcctcag cttcattctg ggcaatcagg attactggca catcctactt     660

ggcctatctg ctgtaccagc tctcctgcag tgtctgctac tgctcttctg tccagaaagc     720

cccagatacc tttacctaaa gttggaagag gaagtcaggg caaagaaaag cttgaaaaga     780

ctaaggggca ctgaggacgt caccaaagat attaatgaga tgaggaaaga aaaggaagag     840

gcgtcgactg agcagaaggt ctccgtgatc cagctcttca cggatccgaa ttatcggcag     900

cccattgtgg tggcactgat gctacacttg gctcagcagt tctctggaat caatgggata     960

ttttactatt caaccagcat ttttcagaca gctggcatca gccagcctgt gtatgcaacc    1020

atcggcgttg gtgccatcaa catgatcttc acggctgtct ctgtgctgct tgtggagaaa    1080

gcggggcggc ggaccctgtt cctggccggg atgattggca tgtttttctg tgccgtcttc    1140

atgtcgctgg gactggtgtt gctggataag ttcacctgga tgagttatgt gagcatgacg    1200

gccatcttcc tcttcgtcag tttctttgag attgggccag gtccaatccc ttggttcatg    1260

gttgctgaat ttttcagcca aggaccccgt cccacggctc tggcactggc tgccttcagc    1320

aactgggtct gcaatttcat catcgccctc tgcttccagt acattgcgga cttcctcggg    1380

ccttacgtgt tcttcctttt tgctggggtg gtcctgatct tcaccctgtt cacatttttt    1440

aaagttccag aaaccaaagg aaagtctttt gacgaaattg ctgcagaatt ccggaagaag    1500

agtggttcgg ccccaccacg caaagccgct gtacaaatgg aattcctggg gtcttcagag    1560

actgtgtga                                                            1569


<210> 104
<211> 522
<212> PRT
<213> Rattus norvegicus

<220> 
<221> SOURCE
<222> 1..522
<223> /mol_type="protein"
      /note="Rattus norvegicus (SLC2A2)"
      /organism="Rattus norvegicus"

<400> 104
Met Ser Glu Asp Lys Ile Thr Gly Thr Leu Ala Phe Thr Val Phe Thr 
1               5                   10                   15    
Ala Val Leu Gly Ser Phe Gln Phe Gly Tyr Asp Ile Gly Val Ile Asn 
            20                   25                  30        
Ala Pro Gln Glu Val Ile Ile Ser His Tyr Arg His Val Leu Gly Val 
        35                   40                  45            
Pro Leu Asp Asp Arg Arg Ala Thr Ile Asn Tyr Asp Ile Asn Gly Thr 
    50                   55                  60                
Asp Thr Pro Leu Ile Val Thr Pro Ala His Thr Thr Pro Asp Ala Trp 
65                   70                  75                  80
Glu Glu Glu Thr Glu Gly Ser Ala His Ile Val Thr Met Leu Trp Ser 
                85                   90                  95    
Leu Ser Val Ser Ser Phe Ala Val Gly Gly Met Val Ala Ser Phe Phe 
            100                  105                110        
Gly Gly Trp Leu Gly Asp Lys Leu Gly Arg Ile Lys Ala Met Leu Ala 
        115                  120                125            
Ala Asn Ser Leu Ser Leu Thr Gly Ala Leu Leu Met Gly Cys Ser Lys 
    130                  135                140                
Phe Gly Pro Ala His Ala Leu Ile Ile Ala Gly Arg Ser Val Ser Gly 
145                  150                155                  160
Leu Tyr Cys Gly Leu Ile Ser Gly Leu Val Pro Met Tyr Ile Gly Glu 
                165                  170                175    
Ile Ala Pro Thr Thr Leu Arg Gly Ala Leu Gly Thr Leu His Gln Leu 
            180                  185                190        
Ala Leu Val Thr Gly Ile Leu Ile Ser Gln Ile Ala Gly Leu Ser Phe 
        195                  200                205            
Ile Leu Gly Asn Gln Asp Tyr Trp His Ile Leu Leu Gly Leu Ser Ala 
    210                  215                220                
Val Pro Ala Leu Leu Gln Cys Leu Leu Leu Leu Phe Cys Pro Glu Ser 
225                  230                235                  240
Pro Arg Tyr Leu Tyr Leu Lys Leu Glu Glu Glu Val Arg Ala Lys Lys 
                245                  250                255    
Ser Leu Lys Arg Leu Arg Gly Thr Glu Asp Val Thr Lys Asp Ile Asn 
            260                  265                270        
Glu Met Arg Lys Glu Lys Glu Glu Ala Ser Thr Glu Gln Lys Val Ser 
        275                  280                285            
Val Ile Gln Leu Phe Thr Asp Pro Asn Tyr Arg Gln Pro Ile Val Val 
    290                  295                300                
Ala Leu Met Leu His Leu Ala Gln Gln Phe Ser Gly Ile Asn Gly Ile 
305                  310                315                  320
Phe Tyr Tyr Ser Thr Ser Ile Phe Gln Thr Ala Gly Ile Ser Gln Pro 
                325                  330                335    
Val Tyr Ala Thr Ile Gly Val Gly Ala Ile Asn Met Ile Phe Thr Ala 
            340                  345                350        
Val Ser Val Leu Leu Val Glu Lys Ala Gly Arg Arg Thr Leu Phe Leu 
        355                  360                365            
Ala Gly Met Ile Gly Met Phe Phe Cys Ala Val Phe Met Ser Leu Gly 
    370                  375                380                
Leu Val Leu Leu Asp Lys Phe Thr Trp Met Ser Tyr Val Ser Met Thr 
385                  390                395                  400
Ala Ile Phe Leu Phe Val Ser Phe Phe Glu Ile Gly Pro Gly Pro Ile 
                405                  410                415    
Pro Trp Phe Met Val Ala Glu Phe Phe Ser Gln Gly Pro Arg Pro Thr 
            420                  425                430        
Ala Leu Ala Leu Ala Ala Phe Ser Asn Trp Val Cys Asn Phe Ile Ile 
        435                  440                445            
Ala Leu Cys Phe Gln Tyr Ile Ala Asp Phe Leu Gly Pro Tyr Val Phe 
    450                  455                460                
Phe Leu Phe Ala Gly Val Val Leu Ile Phe Thr Leu Phe Thr Phe Phe 
465                  470                475                  480
Lys Val Pro Glu Thr Lys Gly Lys Ser Phe Asp Glu Ile Ala Ala Glu 
                485                  490                495    
Phe Arg Lys Lys Ser Gly Ser Ala Pro Pro Arg Lys Ala Ala Val Gln 
            500                  505                510        
Met Glu Phe Leu Gly Ser Ser Glu Thr Val 
        515                  520        

<210> 105
<211> 1769
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..1769
<223> /mol_type="DNA"
      /note="beta-III-tubulin"
      /organism="Homo sapiens"

<400> 105
gacatcagcc gatgcgaagg gcggggccgc ggctataaga gcgcgcggcc gcggtccccg      60

accctcagca gccagcccgg cccgcccgcg cccgtccgca gccgcccgcc agacgcgccc     120

agtatgaggg agatcgtgca catccaggcc ggccagtgcg gcaaccagat cggggccaag     180

ttctgggaag tcatcagtga tgagcatggc atcgacccca gcggcaacta cgtgggcgac     240

tcggacttgc agctggagcg gatcagcgtc tactacaacg aggcctcttc tcacaagtac     300

gtgcctcgag ccattctggt ggacctggaa cccggaacca tggacagtgt ccgctcaggg     360

gcctttggac atctcttcag gcctgacaat ttcatctttg gtcagagtgg ggccggcaac     420

aactgggcca agggtcacta cacggagggg gcggagctgg tggattcggt cctggatgtg     480

gtgcggaagg agtgtgaaaa ctgcgactgc ctgcagggct tccagctgac ccactcgctg     540

gggggcggca cgggctccgg catgggcacg ttgctcatca gcaaggtgcg tgaggagtat     600

cccgaccgca tcatgaacac cttcagcgtc gtgccctcac ccaaggtgtc agacacggtg     660

gtggagccct acaacgccac gctgtccatc caccagctgg tggagaacac ggatgagacc     720

tactgcatcg acaacgaggc gctctacgac atctgcttcc gcaccctcaa gctggccacg     780

cccacctacg gggacctcaa ccacctggta tcggccacca tgagcggagt caccacctcc     840

ttgcgcttcc cgggccagct caacgctgac ctgcgcaagc tggccgtcaa catggtgccc     900

ttcccgcgcc tgcacttctt catgcccggc ttcgcccccc tcacagcccg gggcagccag     960

cagtaccggg ccctgaccgt gcccgagctc acccagcaga tgttcgatgc caagaacatg    1020

atggccgcct gcgacccgcg ccacggccgc tacctgacgg tggccaccgt gttccggggc    1080

cgcatgtcca tgaaggaggt ggacgagcag atgctggcca tccagagcaa gaacagcagc    1140

tacttcgtgg agtggatccc caacaacgtg aaggtggccg tgtgtgacat cccgccccgc    1200

ggcctcaaga tgtcctccac cttcatcggg aacagcacgg ccatccagga gctgttcaag    1260

cgcatctccg agcagttcac ggccatgttc cggcgcaagg ccttcctgca ctggtacacg    1320

ggcgagggca tggacgagat ggagttcacc gaggccgaga gcaacatgaa cgacctggtg    1380

tccgagtacc agcagtacca ggacgccacg gccgaggaag agggcgagat gtacgaagac    1440

gacgaggagg agtcggaggc ccagggcccc aagtgaagct gctcgcagct ggagtgagag    1500

gcaggtggcg gccggggccg aagccagcag tgtctaaacc cccggagcca tcttgctgcc    1560

gacaccctgc tttcccctcg ccctagggct cccttgccgc cctcctgcag tatttatggc    1620

ctcgtcctcc ccacctaggc cacgtgtgag ctgctcctgt ctctgtctta ttgcagctcc    1680

aggcctgacg ttttacggtt ttgtttttta ctggtttgtg tttatatttt cggggatact    1740

taataaatct attgctgtca gataccctt                                      1769


<210> 106
<211> 450
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..450
<223> /mol_type="protein"
      /note="beta-III-tubulin"
      /organism="Homo sapiens"

<400> 106
Met Arg Glu Ile Val His Ile Gln Ala Gly Gln Cys Gly Asn Gln Ile 
1               5                   10                   15    
Gly Ala Lys Phe Trp Glu Val Ile Ser Asp Glu His Gly Ile Asp Pro 
            20                   25                  30        
Ser Gly Asn Tyr Val Gly Asp Ser Asp Leu Gln Leu Glu Arg Ile Ser 
        35                   40                  45            
Val Tyr Tyr Asn Glu Ala Ser Ser His Lys Tyr Val Pro Arg Ala Ile 
    50                   55                  60                
Leu Val Asp Leu Glu Pro Gly Thr Met Asp Ser Val Arg Ser Gly Ala 
65                   70                  75                  80
Phe Gly His Leu Phe Arg Pro Asp Asn Phe Ile Phe Gly Gln Ser Gly 
                85                   90                  95    
Ala Gly Asn Asn Trp Ala Lys Gly His Tyr Thr Glu Gly Ala Glu Leu 
            100                  105                110        
Val Asp Ser Val Leu Asp Val Val Arg Lys Glu Cys Glu Asn Cys Asp 
        115                  120                125            
Cys Leu Gln Gly Phe Gln Leu Thr His Ser Leu Gly Gly Gly Thr Gly 
    130                  135                140                
Ser Gly Met Gly Thr Leu Leu Ile Ser Lys Val Arg Glu Glu Tyr Pro 
145                  150                155                  160
Asp Arg Ile Met Asn Thr Phe Ser Val Val Pro Ser Pro Lys Val Ser 
                165                  170                175    
Asp Thr Val Val Glu Pro Tyr Asn Ala Thr Leu Ser Ile His Gln Leu 
            180                  185                190        
Val Glu Asn Thr Asp Glu Thr Tyr Cys Ile Asp Asn Glu Ala Leu Tyr 
        195                  200                205            
Asp Ile Cys Phe Arg Thr Leu Lys Leu Ala Thr Pro Thr Tyr Gly Asp 
    210                  215                220                
Leu Asn His Leu Val Ser Ala Thr Met Ser Gly Val Thr Thr Ser Leu 
225                  230                235                  240
Arg Phe Pro Gly Gln Leu Asn Ala Asp Leu Arg Lys Leu Ala Val Asn 
                245                  250                255    
Met Val Pro Phe Pro Arg Leu His Phe Phe Met Pro Gly Phe Ala Pro 
            260                  265                270        
Leu Thr Ala Arg Gly Ser Gln Gln Tyr Arg Ala Leu Thr Val Pro Glu 
        275                  280                285            
Leu Thr Gln Gln Met Phe Asp Ala Lys Asn Met Met Ala Ala Cys Asp 
    290                  295                300                
Pro Arg His Gly Arg Tyr Leu Thr Val Ala Thr Val Phe Arg Gly Arg 
305                  310                315                  320
Met Ser Met Lys Glu Val Asp Glu Gln Met Leu Ala Ile Gln Ser Lys 
                325                  330                335    
Asn Ser Ser Tyr Phe Val Glu Trp Ile Pro Asn Asn Val Lys Val Ala 
            340                  345                350        
Val Cys Asp Ile Pro Pro Arg Gly Leu Lys Met Ser Ser Thr Phe Ile 
        355                  360                365            
Gly Asn Ser Thr Ala Ile Gln Glu Leu Phe Lys Arg Ile Ser Glu Gln 
    370                  375                380                
Phe Thr Ala Met Phe Arg Arg Lys Ala Phe Leu His Trp Tyr Thr Gly 
385                  390                395                  400
Glu Gly Met Asp Glu Met Glu Phe Thr Glu Ala Glu Ser Asn Met Asn 
                405                  410                415    
Asp Leu Val Ser Glu Tyr Gln Gln Tyr Gln Asp Ala Thr Ala Glu Glu 
            420                  425                430        
Glu Gly Glu Met Tyr Glu Asp Asp Glu Glu Glu Ser Glu Ala Gln Gly 
        435                  440                445            
Pro Lys 
    450

<210> 107
<211> 1704
<212> DNA
<213> Rattus norvegicus

<220> 
<221> source
<222> 1..1704
<223> /mol_type="DNA"
      /note="beta-III-tubulin"
      /organism="Rattus norvegicus"

<400> 107
atcctccgca gcccgctgtc cgcctgcctc ttcgtctcta gccgagtgaa gtcagcatga      60

gggagatcgt gcacatccag gccggccagt gcggcaacca gataggggcc aagttctggg     120

aggtcatcag tgacgagcat ggcatagacc ccagcggcaa ctatgtgggg gactcggacc     180

tgcagctgga acgcatcagt gtctactaca atgaggcctc ctctcacaag tatgtgccca     240

gagccattct ggtggacctg gagcctggaa ccatggacag cgttcggtct ggggcctttg     300

gacacctatt caggcctgac aactttatct tcggtcagag tggtgctggc aacaactggg     360

ccaaagggca ctatacagag ggcgccgagc tggtggactc agtcctggat gtcgtgagga     420

aagaatgtga gaattgtgac tgcctgcagg gcttccagct cactcactca ctgggtgggg     480

gcacgggctc aggcatgggc acactgctca tcagcaaagt gcgtgaggag taccctgacc     540

gcatcatgaa caccttcagc gtggtgccct cacccaaagt gtcagacacc gtggtagagc     600

cctacaacgc caccctgtcc atccaccagc tagtggagaa cacggatgag acctactgca     660

tcgacaatga agccctctac gacatctgct tccgcaccct caagctggct acacccacct     720

acggggacct caaccacctt gtgtctgcta ccatgagcgg agtcaccacc tcccttcgat     780

tccctggtca gctcaatgcc gacctccgca agctagctgt caacatggtg cccttccccc     840

gcttgcattt cttcatgccc ggctttgccc cactaacagc ccggggcagc caacagtacc     900

gtgccctgac ggtgcctgag ctcacccagc agatgttcga cgccaagaac atgatggctg     960

cctgtgaccc acgccacggc cgctacctga ccgtggccac cgtcttccgt gggcgcatgt    1020

ccatgaagga ggtggatgag cagatgctgg ccattcagag taagaacagt agttacttcg    1080

tggagtggat ccccaacaac gtcaaggtag cggtgtgtga catcccgccc cgagggctca    1140

agatgtcgtc caccttcatc ggcaacagca cggccatcca ggagctgttc aagcgcatct    1200

ccgagcagtt tacggccatg ttccggcgca aggccttcct ccactggtac acgggcgaag    1260

gcatggatga gatggagttc accgaggccg agagcaacat gaacgacctg gtgtctgagt    1320

accagcagta ccaggacgcc actgccgagg aggaggggga gatgtatgaa gatgacgacg    1380

aggagtcgga agcccagggg cccaagtgaa gttgcttgca gctggggtgt ggggccaagt    1440

ggcagccagg gccaagacaa gcagcatctg tcccccagag ccatctagct actgacactg    1500

cccccagctt accttcctac cagctcttca gggcacccta gggctcccgg gttaaagtcc    1560

ttcagtattt atggccatcc cccaccccac gtgagtccac ttggctctgt cctccccgtt    1620

ttagccacct ttgtatttat gttgcttttg tgtctgtttt attatggctc caggcctgat    1680

gttttatgtt tttttttttt ttta                                           1704


<210> 108
<211> 450
<212> PRT
<213> Rattus norvegicus

<220> 
<221> SOURCE
<222> 1..450
<223> /mol_type="protein"
      /note="beta-III-tubulin"
      /organism="Rattus norvegicus"

<400> 108
Met Arg Glu Ile Val His Ile Gln Ala Gly Gln Cys Gly Asn Gln Ile 
1               5                   10                   15    
Gly Ala Lys Phe Trp Glu Val Ile Ser Asp Glu His Gly Ile Asp Pro 
            20                   25                  30        
Ser Gly Asn Tyr Val Gly Asp Ser Asp Leu Gln Leu Glu Arg Ile Ser 
        35                   40                  45            
Val Tyr Tyr Asn Glu Ala Ser Ser His Lys Tyr Val Pro Arg Ala Ile 
    50                   55                  60                
Leu Val Asp Leu Glu Pro Gly Thr Met Asp Ser Val Arg Ser Gly Ala 
65                   70                  75                  80
Phe Gly His Leu Phe Arg Pro Asp Asn Phe Ile Phe Gly Gln Ser Gly 
                85                   90                  95    
Ala Gly Asn Asn Trp Ala Lys Gly His Tyr Thr Glu Gly Ala Glu Leu 
            100                  105                110        
Val Asp Ser Val Leu Asp Val Val Arg Lys Glu Cys Glu Asn Cys Asp 
        115                  120                125            
Cys Leu Gln Gly Phe Gln Leu Thr His Ser Leu Gly Gly Gly Thr Gly 
    130                  135                140                
Ser Gly Met Gly Thr Leu Leu Ile Ser Lys Val Arg Glu Glu Tyr Pro 
145                  150                155                  160
Asp Arg Ile Met Asn Thr Phe Ser Val Val Pro Ser Pro Lys Val Ser 
                165                  170                175    
Asp Thr Val Val Glu Pro Tyr Asn Ala Thr Leu Ser Ile His Gln Leu 
            180                  185                190        
Val Glu Asn Thr Asp Glu Thr Tyr Cys Ile Asp Asn Glu Ala Leu Tyr 
        195                  200                205            
Asp Ile Cys Phe Arg Thr Leu Lys Leu Ala Thr Pro Thr Tyr Gly Asp 
    210                  215                220                
Leu Asn His Leu Val Ser Ala Thr Met Ser Gly Val Thr Thr Ser Leu 
225                  230                235                  240
Arg Phe Pro Gly Gln Leu Asn Ala Asp Leu Arg Lys Leu Ala Val Asn 
                245                  250                255    
Met Val Pro Phe Pro Arg Leu His Phe Phe Met Pro Gly Phe Ala Pro 
            260                  265                270        
Leu Thr Ala Arg Gly Ser Gln Gln Tyr Arg Ala Leu Thr Val Pro Glu 
        275                  280                285            
Leu Thr Gln Gln Met Phe Asp Ala Lys Asn Met Met Ala Ala Cys Asp 
    290                  295                300                
Pro Arg His Gly Arg Tyr Leu Thr Val Ala Thr Val Phe Arg Gly Arg 
305                  310                315                  320
Met Ser Met Lys Glu Val Asp Glu Gln Met Leu Ala Ile Gln Ser Lys 
                325                  330                335    
Asn Ser Ser Tyr Phe Val Glu Trp Ile Pro Asn Asn Val Lys Val Ala 
            340                  345                350        
Val Cys Asp Ile Pro Pro Arg Gly Leu Lys Met Ser Ser Thr Phe Ile 
        355                  360                365            
Gly Asn Ser Thr Ala Ile Gln Glu Leu Phe Lys Arg Ile Ser Glu Gln 
    370                  375                380                
Phe Thr Ala Met Phe Arg Arg Lys Ala Phe Leu His Trp Tyr Thr Gly 
385                  390                395                  400
Glu Gly Met Asp Glu Met Glu Phe Thr Glu Ala Glu Ser Asn Met Asn 
                405                  410                415    
Asp Leu Val Ser Glu Tyr Gln Gln Tyr Gln Asp Ala Thr Ala Glu Glu 
            420                  425                430        
Glu Gly Glu Met Tyr Glu Asp Asp Asp Glu Glu Ser Glu Ala Gln Gly 
        435                  440                445            
Pro Lys 
    450

<210> 109
<211> 1691
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..1691
<223> /mol_type="DNA"
      /note="GAP43 isoform 2"
      /organism="Homo sapiens"

<400> 109
tccgagaaag agacggagag agagggaaga aaaagacaga tagatagata ttggggggaa      60

ggagaaaaaa ggagaagaga gggaagagag gacagcggag agagagcacc agagagagag     120

ggagagagag agagagcgct agagagaggg agcgagcatg tgcgatgagc aatagctgtg     180

gaccttacag ttgctgctaa ctgccctggt gtgtgtgagg gagagagagg gagggaggga     240

gagagagcgc gctagcgcga gagagcgagt gagcaagcga gcagaaaaga ggtggagagg     300

gggggaataa gaaagagaga gaaggaaagg agagaaggca ggaagaaggc aagggacgag     360

acaaccatgc tgtgctgtat gagaagaacc aaacaggttg aaaaaaatga tgacgaccaa     420

aagattgaac aagatggtat caaaccagaa gataaagctc ataaggccgc aaccaaaatt     480

caggctagct tccgtggaca cataacaagg aaaaagctca aaggagagaa gaaggatgat     540

gtccaagctg ctgaggctga agctaataag aaggatgaag cccctgttgc cgatggggtg     600

gagaagaagg gagaaggcac cactactgcc gaagcagccc cagccactgg ctccaagcct     660

gatgagcccg gcaaagcagg agaaactcct tccgaggaga agaaggggga gggtgatgct     720

gccacagagc aggcagcccc ccaggctcct gcatcctcag aggagaaggc cggctcagct     780

gagacagaaa gtgccactaa agcttccact gataactcgc cgtcctccaa ggctgaagat     840

gccccagcca aggaggagcc taaacaagcc gatgtgcctg ctgctgtcac tgctgctgct     900

gccaccaccc ctgccgcaga ggatgctgct gccaaggcaa cagcccagcc tccaacggag     960

actggggaga gcagccaagc tgaagagaac atagaagctg tagatgaaac caaacctaag    1020

gaaagtgccc ggcaggacga gggtaaagaa gaggaacctg aggctgacca agaacatgcc    1080

tgaactctaa gaaatggctt tccacatccc caccctcccc tctcctgagc ctgtctctcc    1140

ctaccctctt ctcagctcca ctctgaagtc ccttcctgtc ctgctcacgt ctgtgagtct    1200

gtcctttccc acccactagc cctctttctc tctgtgtggc aaacatttaa aaaaaaaaaa    1260

aaaaagcagg aaagatccca agtcaaacag tgtggcttaa acattttttg tttcttggtg    1320

ttgttatggc aagtttttgg taatgatgat tcaatcattt tgggaaattc ttgcactgta    1380

tccaagttat ttgatctggt gcgtgtggcc ctgtgggagt ccactttcct ctctctctct    1440

ctctctgttc caagtgtgtg tgcaatgttc cgttcatctg aggagtccaa aatatcgagt    1500

gaattcaaaa tcatttttgt tttcctcctt ttcaatgtga tggaatgaac aaaaaggaaa    1560

aaattcaaaa aacccagttt gttttaaaaa taaataaata aagcaaatgt gccaattagc    1620

gtaaacttgc ggctctaagg ctcctttttc aacccgaata ttaataaatc atgagagtaa    1680

tcaaggtcca a                                                         1691


<210> 110
<211> 238
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..238
<223> /mol_type="protein"
      /note="GAP43 isoform 2"
      /organism="Homo sapiens"

<400> 110
Met Leu Cys Cys Met Arg Arg Thr Lys Gln Val Glu Lys Asn Asp Asp 
1               5                   10                   15    
Asp Gln Lys Ile Glu Gln Asp Gly Ile Lys Pro Glu Asp Lys Ala His 
            20                   25                  30        
Lys Ala Ala Thr Lys Ile Gln Ala Ser Phe Arg Gly His Ile Thr Arg 
        35                   40                  45            
Lys Lys Leu Lys Gly Glu Lys Lys Asp Asp Val Gln Ala Ala Glu Ala 
    50                   55                  60                
Glu Ala Asn Lys Lys Asp Glu Ala Pro Val Ala Asp Gly Val Glu Lys 
65                   70                  75                  80
Lys Gly Glu Gly Thr Thr Thr Ala Glu Ala Ala Pro Ala Thr Gly Ser 
                85                   90                  95    
Lys Pro Asp Glu Pro Gly Lys Ala Gly Glu Thr Pro Ser Glu Glu Lys 
            100                  105                110        
Lys Gly Glu Gly Asp Ala Ala Thr Glu Gln Ala Ala Pro Gln Ala Pro 
        115                  120                125            
Ala Ser Ser Glu Glu Lys Ala Gly Ser Ala Glu Thr Glu Ser Ala Thr 
    130                  135                140                
Lys Ala Ser Thr Asp Asn Ser Pro Ser Ser Lys Ala Glu Asp Ala Pro 
145                  150                155                  160
Ala Lys Glu Glu Pro Lys Gln Ala Asp Val Pro Ala Ala Val Thr Ala 
                165                  170                175    
Ala Ala Ala Thr Thr Pro Ala Ala Glu Asp Ala Ala Ala Lys Ala Thr 
            180                  185                190        
Ala Gln Pro Pro Thr Glu Thr Gly Glu Ser Ser Gln Ala Glu Glu Asn 
        195                  200                205            
Ile Glu Ala Val Asp Glu Thr Lys Pro Lys Glu Ser Ala Arg Gln Asp 
    210                  215                220                
Glu Gly Lys Glu Glu Glu Pro Glu Ala Asp Gln Glu His Ala 
225                  230                235            

<210> 111
<211> 1901
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..1901
<223> /mol_type="DNA"
      /note="GAP43 isoform 1"
      /organism="Homo sapiens"

<400> 111
acagttgctg ctaactgccc tggtgtgtgt gagggagaga gagggaggga gggagagaga      60

gcgcgctagc gcgagagagc gagtgagcaa gcgagcagaa aagaggtgga gaggggggga     120

ataagaaaga gagagaagga aaggagagaa ggcaggaaga aggcaaggga cgagacaacc     180

atgctgtgct gtatgagaag aaccaaacag aattaaaagg gaacctggtc tctgggttgt     240

tttcaacatc tcaagtgtga attttccctg tcaaaatctt cacaaggaaa atgagtcaca     300

gcatcacctg ggtgacgagg tcataacacc tcagcccttg cttaaaaaat tttatttcta     360

cttttctatt gtaaagagat ctcaaaacag gaagataaaa ttggactgac agctctacag     420

cctagtcttt tagacagtga actaggccag cattggcaga cactggcgat gacaaagtcc     480

tgctctgaat tatgccaccc cgcactccac tttttacctt gcctgggagg cttgaggaaa     540

aatcttcaga gagcagttcg acctagtcct tattcacttg gcttcttgac tttctggatt     600

tcaagggttg aaaaaaatga tgacgaccaa aagattgaac aagatggtat caaaccagaa     660

gataaagctc ataaggccgc aaccaaaatt caggctagct tccgtggaca cataacaagg     720

aaaaagctca aaggagagaa gaaggatgat gtccaagctg ctgaggctga agctaataag     780

aaggatgaag cccctgttgc cgatggggtg gagaagaagg gagaaggcac cactactgcc     840

gaagcagccc cagccactgg ctccaagcct gatgagcccg gcaaagcagg agaaactcct     900

tccgaggaga agaaggggga gggtgatgct gccacagagc aggcagcccc ccaggctcct     960

gcatcctcag aggagaaggc cggctcagct gagacagaaa gtgccactaa agcttccact    1020

gataactcgc cgtcctccaa ggctgaagat gccccagcca aggaggagcc taaacaagcc    1080

gatgtgcctg ctgctgtcac tgctgctgct gccaccaccc ctgccgcaga ggatgctgct    1140

gccaaggcaa cagcccagcc tccaacggag actggggaga gcagccaagc tgaagagaac    1200

atagaagctg tagatgaaac caaacctaag gaaagtgccc ggcaggacga gggtaaagaa    1260

gaggaacctg aggctgacca agaacatgcc tgaactctaa gaaatggctt tccacatccc    1320

caccctcccc tctcctgagc ctgtctctcc ctaccctctt ctcagctcca ctctgaagtc    1380

ccttcctgtc ctgctcacgt ctgtgagtct gtcctttccc acccactagc cctctttctc    1440

tctgtgtggc aaacatttaa aaaaaaaaaa aaaaagcagg aaagatccca agtcaaacag    1500

tgtggcttaa acattttttg tttcttggtg ttgttatggc aagtttttgg taatgatgat    1560

tcaatcattt tgggaaattc ttgcactgta tccaagttat ttgatctggt gcgtgtggcc    1620

ctgtgggagt ccactttcct ctctctctct ctctctgttc caagtgtgtg tgcaatgttc    1680

cgttcatctg aggagtccaa aatatcgagt gaattcaaaa tcatttttgt tttcctcctt    1740

ttcaatgtga tggaatgaac aaaaaggaaa aaattcaaaa aacccagttt gttttaaaaa    1800

taaataaata aagcaaatgt gccaattagc gtaaacttgc ggctctaagg ctcctttttc    1860

aacccgaata ttaataaatc atgagagtaa tcaaggtcca a                        1901


<210> 112
<211> 274
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..274
<223> /mol_type="protein"
      /note="GAP43 isoform 1"
      /organism="Homo sapiens"

<400> 112
Met Thr Lys Ser Cys Ser Glu Leu Cys His Pro Ala Leu His Phe Leu 
1               5                   10                   15    
Pro Cys Leu Gly Gly Leu Arg Lys Asn Leu Gln Arg Ala Val Arg Pro 
            20                   25                  30        
Ser Pro Tyr Ser Leu Gly Phe Leu Thr Phe Trp Ile Ser Arg Val Glu 
        35                   40                  45            
Lys Asn Asp Asp Asp Gln Lys Ile Glu Gln Asp Gly Ile Lys Pro Glu 
    50                   55                  60                
Asp Lys Ala His Lys Ala Ala Thr Lys Ile Gln Ala Ser Phe Arg Gly 
65                   70                  75                  80
His Ile Thr Arg Lys Lys Leu Lys Gly Glu Lys Lys Asp Asp Val Gln 
                85                   90                  95    
Ala Ala Glu Ala Glu Ala Asn Lys Lys Asp Glu Ala Pro Val Ala Asp 
            100                  105                110        
Gly Val Glu Lys Lys Gly Glu Gly Thr Thr Thr Ala Glu Ala Ala Pro 
        115                  120                125            
Ala Thr Gly Ser Lys Pro Asp Glu Pro Gly Lys Ala Gly Glu Thr Pro 
    130                  135                140                
Ser Glu Glu Lys Lys Gly Glu Gly Asp Ala Ala Thr Glu Gln Ala Ala 
145                  150                155                  160
Pro Gln Ala Pro Ala Ser Ser Glu Glu Lys Ala Gly Ser Ala Glu Thr 
                165                  170                175    
Glu Ser Ala Thr Lys Ala Ser Thr Asp Asn Ser Pro Ser Ser Lys Ala 
            180                  185                190        
Glu Asp Ala Pro Ala Lys Glu Glu Pro Lys Gln Ala Asp Val Pro Ala 
        195                  200                205            
Ala Val Thr Ala Ala Ala Ala Thr Thr Pro Ala Ala Glu Asp Ala Ala 
    210                  215                220                
Ala Lys Ala Thr Ala Gln Pro Pro Thr Glu Thr Gly Glu Ser Ser Gln 
225                  230                235                  240
Ala Glu Glu Asn Ile Glu Ala Val Asp Glu Thr Lys Pro Lys Glu Ser 
                245                  250                255    
Ala Arg Gln Asp Glu Gly Lys Glu Glu Glu Pro Glu Ala Asp Gln Glu 
            260                  265                270        
His Ala 
        

<210> 113
<211> 1481
<212> DNA
<213> Rattus norvegicus

<220> 
<221> source
<222> 1..1481
<223> /mol_type="DNA"
      /note="GAP43"
      /organism="Rattus norvegicus"

<400> 113
ctgatcgctg tagaccttac agttgctgct aactgccctg gtgtgtgtga gggagagaga      60

gggagagaga gggagaggga gggagggagg gagggagagc gcgctagcgc gagagagcga     120

gtgagcaagc gagcagaaaa gaggtggaga gggggggaat aaggaagaga ggaggaaagg     180

agagaaggca ggaagaaggc aggggaagat accaccatgc tgtgctgtat gagaagaacc     240

aaacaggttg aaaagaatga tgaggaccaa aagattgaac aagatggtgt caaaccggag     300

gataaggctc ataaggctgc aaccaaaatt caggctagct tccgtggaca cataacaagg     360

aaaaagctca aagacgagaa gaagggtgat gcaccagctg ctgaggccga ggccaaggag     420

aaggatgatg ctcccgttgc tgatggtgtg gagaagaagg agggagatgg ctctgctact     480

accgatgcag ccccagccac cagccctaag gctgaggagc ccagcaaggc aggagatgca     540

ccttctgagg agaagaaggg cgaaggggat gcggcccctt cagaggaaaa ggccggctca     600

gctgagacag aaagtgctgc taaagctacc actgataact cgccgtcctc caaggccgaa     660

gatggcccag ccaaggagga gcctaaacaa gccgatgtgc ctgctgctgt cactgatgct     720

gctgccacca cccctgctgc agaggatgct gccaaggcag cgcagcctcc aacggagact     780

gcagaaagca gccaagctga ggaggagaaa gaagctgtag atgaagccaa acctaaggaa     840

agtgcccgac aggatgaggg taaagaagac cccgaggctg accaagaaca tgcctgaact     900

ttaagaaacg gctttccacg ttgcccccac ctgaaccctg tctctcctgc cctttctcag     960

atccactctg aagtttcctc tcctgtcctg ctcacgtgtg tgagcctgtc ctctcctacc    1020

tatgagccct ctctctctgt gtggcaaaca ttaaaaaaaa aaaaaagcag gaaagatccc    1080

aagtccaaca gtgtggctta aacatttgtt tcttggtgtt gttatggcga gtttttggta    1140

atgatgatgc agtcatcttg ggaaattctt gcactgtacc ccggtttttt gatctggtgc    1200

gtgtggccct gtgggagtcc actttcctct ctatttctct ctgttccaag tgtgtgtgtg    1260

caatgttccg ttctgaggag tccaaaatat taagtgaatt caaaaaacca tttctgtttc    1320

ctcattttca atgtgatgga atgaacaaaa aggttaaaaa aattaaaaaa aaaacggttt    1380

gttttaaaaa taaataaata aagcaaatgt gccaattagc gtaacttaag gctgtgaggc    1440

tcctttttca atctgaatat taataaatca tgagagtaat c                        1481


<210> 114
<211> 226
<212> PRT
<213> Rattus norvegicus

<220> 
<221> SOURCE
<222> 1..226
<223> /mol_type="protein"
      /note="GAP43"
      /organism="Rattus norvegicus"

<400> 114
Met Leu Cys Cys Met Arg Arg Thr Lys Gln Val Glu Lys Asn Asp Glu 
1               5                   10                   15    
Asp Gln Lys Ile Glu Gln Asp Gly Val Lys Pro Glu Asp Lys Ala His 
            20                   25                  30        
Lys Ala Ala Thr Lys Ile Gln Ala Ser Phe Arg Gly His Ile Thr Arg 
        35                   40                  45            
Lys Lys Leu Lys Asp Glu Lys Lys Gly Asp Ala Pro Ala Ala Glu Ala 
    50                   55                  60                
Glu Ala Lys Glu Lys Asp Asp Ala Pro Val Ala Asp Gly Val Glu Lys 
65                   70                  75                  80
Lys Glu Gly Asp Gly Ser Ala Thr Thr Asp Ala Ala Pro Ala Thr Ser 
                85                   90                  95    
Pro Lys Ala Glu Glu Pro Ser Lys Ala Gly Asp Ala Pro Ser Glu Glu 
            100                  105                110        
Lys Lys Gly Glu Gly Asp Ala Ala Pro Ser Glu Glu Lys Ala Gly Ser 
        115                  120                125            
Ala Glu Thr Glu Ser Ala Ala Lys Ala Thr Thr Asp Asn Ser Pro Ser 
    130                  135                140                
Ser Lys Ala Glu Asp Gly Pro Ala Lys Glu Glu Pro Lys Gln Ala Asp 
145                  150                155                  160
Val Pro Ala Ala Val Thr Asp Ala Ala Ala Thr Thr Pro Ala Ala Glu 
                165                  170                175    
Asp Ala Ala Lys Ala Ala Gln Pro Pro Thr Glu Thr Ala Glu Ser Ser 
            180                  185                190        
Gln Ala Glu Glu Glu Lys Glu Ala Val Asp Glu Ala Lys Pro Lys Glu 
        195                  200                205            
Ser Ala Arg Gln Asp Glu Gly Lys Glu Asp Pro Glu Ala Asp Gln Glu 
    210                  215                220                
His Ala 
225    

<210> 115
<211> 3081
<212> DNA
<213> Homo sapiens

<220> 
<221> source
<222> 1..3081
<223> /mol_type="DNA"
      /note="GFAP"
      /organism="Homo sapiens"

<400> 115
agtctagccc actccttcat aaagccctcg catcccagga gcgagcagag ccagagcagg      60

atggagagga gacgcatcac ctccgctgct cgccgctcct acgtctcctc aggggagatg     120

atggtggggg gcctggctcc tggccgccgt ctgggtcctg gcacccgcct ctccctggct     180

cgaatgcccc ctccactccc gacccgggtg gatttctccc tggctggggc actcaatgct     240

ggcttcaagg agacccgggc cagtgagcgg gcagagatga tggagctcaa tgaccgcttt     300

gccagctaca tcgagaaggt tcgcttcctg gaacagcaaa acaaggcgct ggctgctgag     360

ctgaaccagc tgcgggccaa ggagcccacc aagctggcag acgtctacca ggctgagctg     420

cgagagctgc ggctgcggct cgatcaactc accgccaaca gcgcccggct ggaggttgag     480

agggacaatc tggcacagga cctggccact gtgaggcaga agctccagga tgaaaccaac     540

ctgaggctgg aagccgagaa caacctggct gcctatagac aggaagcaga tgaagccacc     600

ctggcccgtc tggatctgga gaggaagatt gagtcgctgg aggaggagat ccggttcttg     660

aggaagatcc acgaggagga ggttcgggaa ctccaggagc agctggcccg acagcaggtc     720

catgtggagc ttgacgtggc caagccagac ctcaccgcag ccctgaaaga gatccgcacg     780

cagtatgagg caatggcgtc cagcaacatg catgaagccg aagagtggta ccgctccaag     840

tttgcagacc tgacagacgc tgctgcccgc aacgcggagc tgctccgcca ggccaagcac     900

gaagccaacg actaccggcg ccagttgcag tccttgacct gcgacctgga gtctctgcgc     960

ggcacgaacg agtccctgga gaggcagatg cgcgagcagg aggagcggca cgtgcgggag    1020

gcggccagtt atcaggaggc gctggcgcgg ctggaggaag aggggcagag cctcaaggac    1080

gagatggccc gccacttgca ggagtaccag gacctgctca atgtcaagct ggccctggac    1140

atcgagatcg ccacctacag gaagctgcta gagggcgagg agaaccggat caccattccc    1200

gtgcagacct tctccaacct gcagattcga gaaaccagcc tggacaccaa gtctgtgtca    1260

gaaggccacc tcaagaggaa catcgtggtg aagaccgtgg agatgcggga tggagaggtc    1320

attaaggagt ccaagcagga gcacaaggat gtgatgtgag gcaggaccca cctggtggcc    1380

tctgccccgt ctcatgaggg gcccgagcag aagcaggata gttgctccgc ctctgctggc    1440

acatttcccc agacctgagc tccccaccac cccagctgct cccctccctc ctctgtccct    1500

aggtcagctt gctgccctag gctccgtcag tatcaggcct gccagacggc acccacccag    1560

cacccagcaa ctccaactaa caagaaactc acccccaagg ggcagtctgg aggggcatgg    1620

ccagcagctt gcgttagaat gaggaggaag gagagaaggg gaggagggcg gggggcacct    1680

actacatcgc cctccacatc cctgattcct gttgttatgg aaactgttgc cagagatgga    1740

ggttctctcg gagtatctgg gaactgtgcc tttgagtttc ctcaggctgc tggaggaaaa    1800

ctgagactca gacaggaaag ggaaggcccc acagacaagg tagccctggc cagaggcttg    1860

ttttgtcttt tggtttttat gaggtgggat atccctatgc tgcctaggct gaccttgaac    1920

tcctgggctc aagcagtcta cccacctcag cctcctgtgt agctgggatt atagattgga    1980

gccaccatgc ccagctcaga gggttgttct cctagactga ccctgatcag tctaagatgg    2040

gtggggacgt cctgccacct ggggcagtca cctgcccaga tcccagaagg acctcctgag    2100

cgatgactca agtgtctcag tccacctgag ctgccatcca gggatgccat ctgtgggcac    2160

gctgtgggca ggtgggagct tgattctcag cacttggggg atctgttgtg tacgtggaga    2220

gggatgaggt gctgggaggg atagaggggg gctgcctggc ccccagctgt gggtacagag    2280

aggtcaagcc caggaggact gccccgtgca gactggaggg gacgctggta gagatggagg    2340

aggaggcaat tgggatggcg ctaggcatac aagtaggggt tgtgggtgac cagttgcact    2400

tggcctctgg attgtgggaa ttaaggaagt gactcatcct cttgaagatg ctgaaacagg    2460

agagaaaggg gatgtatcca tgggggcagg gcatgacttt gtcccatttc taaaggcctc    2520

ttccttgctg tgtcatacca ggccgcccca gcctctgagc ccctgggact gctgcttctt    2580

aaccccagta agccactgcc acacgtctga ccctctccac cccatagtga ccggctgctt    2640

ttccctaagc caagggcctc ttgcggtccc ttcttactca cacacaaaat gtacccagta    2700

ttctaggtag tgccctattt tacaattgta aaactgaggc acgagcaaag tgaagacact    2760

ggctcatatt cctgcagcct ggaggccggg tgctcagggc tgacacgtcc accccagtgc    2820

acccactctg ctttgactga gcagactggt gagcagactg gtgggatctg tgcccagaga    2880

tgggactggg agggcccact tcagggttct cctctcccct ctaaggccga agaagggtcc    2940

ttccctctcc ccaagacttg gtgtcctttc cctccactcc ttcctgccac ctgctgctgc    3000

tgctgctgct aatcttcagg gcactgctgc tgcctttagt cgctgaggaa aaataaagac    3060

aaatgctgcg cccttcccca g                                              3081


<210> 116
<211> 432
<212> PRT
<213> Homo sapiens

<220> 
<221> SOURCE
<222> 1..432
<223> /mol_type="protein"
      /note="GFAP"
      /organism="Homo sapiens"

<400> 116
Met Glu Arg Arg Arg Ile Thr Ser Ala Ala Arg Arg Ser Tyr Val Ser 
1               5                   10                   15    
Ser Gly Glu Met Met Val Gly Gly Leu Ala Pro Gly Arg Arg Leu Gly 
            20                   25                  30        
Pro Gly Thr Arg Leu Ser Leu Ala Arg Met Pro Pro Pro Leu Pro Thr 
        35                   40                  45            
Arg Val Asp Phe Ser Leu Ala Gly Ala Leu Asn Ala Gly Phe Lys Glu 
    50                   55                  60                
Thr Arg Ala Ser Glu Arg Ala Glu Met Met Glu Leu Asn Asp Arg Phe 
65                   70                  75                  80
Ala Ser Tyr Ile Glu Lys Val Arg Phe Leu Glu Gln Gln Asn Lys Ala 
                85                   90                  95    
Leu Ala Ala Glu Leu Asn Gln Leu Arg Ala Lys Glu Pro Thr Lys Leu 
            100                  105                110        
Ala Asp Val Tyr Gln Ala Glu Leu Arg Glu Leu Arg Leu Arg Leu Asp 
        115                  120                125            
Gln Leu Thr Ala Asn Ser Ala Arg Leu Glu Val Glu Arg Asp Asn Leu 
    130                  135                140                
Ala Gln Asp Leu Ala Thr Val Arg Gln Lys Leu Gln Asp Glu Thr Asn 
145                  150                155                  160
Leu Arg Leu Glu Ala Glu Asn Asn Leu Ala Ala Tyr Arg Gln Glu Ala 
                165                  170                175    
Asp Glu Ala Thr Leu Ala Arg Leu Asp Leu Glu Arg Lys Ile Glu Ser 
            180                  185                190        
Leu Glu Glu Glu Ile Arg Phe Leu Arg Lys Ile His Glu Glu Glu Val 
        195                  200                205            
Arg Glu Leu Gln Glu Gln Leu Ala Arg Gln Gln Val His Val Glu Leu 
    210                  215                220                
Asp Val Ala Lys Pro Asp Leu Thr Ala Ala Leu Lys Glu Ile Arg Thr 
225                  230                235                  240
Gln Tyr Glu Ala Met Ala Ser Ser Asn Met His Glu Ala Glu Glu Trp 
                245                  250                255    
Tyr Arg Ser Lys Phe Ala Asp Leu Thr Asp Ala Ala Ala Arg Asn Ala 
            260                  265                270        
Glu Leu Leu Arg Gln Ala Lys His Glu Ala Asn Asp Tyr Arg Arg Gln 
        275                  280                285            
Leu Gln Ser Leu Thr Cys Asp Leu Glu Ser Leu Arg Gly Thr Asn Glu 
    290                  295                300                
Ser Leu Glu Arg Gln Met Arg Glu Gln Glu Glu Arg His Val Arg Glu 
305                  310                315                  320
Ala Ala Ser Tyr Gln Glu Ala Leu Ala Arg Leu Glu Glu Glu Gly Gln 
                325                  330                335    
Ser Leu Lys Asp Glu Met Ala Arg His Leu Gln Glu Tyr Gln Asp Leu 
            340                  345                350        
Leu Asn Val Lys Leu Ala Leu Asp Ile Glu Ile Ala Thr Tyr Arg Lys 
        355                  360                365            
Leu Leu Glu Gly Glu Glu Asn Arg Ile Thr Ile Pro Val Gln Thr Phe 
    370                  375                380                
Ser Asn Leu Gln Ile Arg Glu Thr Ser Leu Asp Thr Lys Ser Val Ser 
385                  390                395                  400
Glu Gly His Leu Lys Arg Asn Ile Val Val Lys Thr Val Glu Met Arg 
                405                  410                415    
Asp Gly Glu Val Ile Lys Glu Ser Lys Gln Glu His Lys Asp Val Met 
            420                  425                430        

<210> 117
<211> 1318
<212> DNA
<213> Rattus norvegicus

<220> 
<221> source
<222> 1..1318
<223> /mol_type="DNA"
      /note="GFAP"
      /organism="Rattus norvegicus"

<400> 117
caggagccag cagaagcagg gcaagatgga gcggagacgt atcacctctg cacgccgctc      60

ctatgcctcc tccgagacga tggtcagggg ccatggtcct accagacacc tgggtaccat     120

tccgcgcctc tccctgtctc gaatgacgcc tccactccct gccagggtag acttctccct     180

ggccggggcg ctcaatgccg gcttcaaaga gactcgggcc agcgagcgtg cggagatgat     240

ggagctcaat gaccgctttg ctagctacat cgagaaggtc cgcttcctgg aacagcaaaa     300

caaggcgctg gcagctgagc tgaaccagct tcgagccaag gagcccacca aactggctga     360

cgtttaccag gcagaacttc gggagctgcg gctgcgtctg gaccagctta ctaccaacag     420

tgcccggctg gaggtggaga gggacaatct cacacaggac ctcggcaccc tgaggcagaa     480

gctccaagat gaaaccaacc tgaggctgga ggcggagaac aacctggctg tgtacagaca     540

ggaggcggat gaagccacct tggctcgtgt ggatctggag aggaaggttg agtcgctgga     600

ggaggagatc cagttcttga ggaagatcca tgaggaggaa gttcgagaac tccaggagca     660

gctggcccag cagcaggtcc acgtggagat ggatgtggcc aagccagacc tcacagcggc     720

tctgagagag attcgcactc agtacgaggc agtggccacc agtaacatgc aagaaacaga     780

agagtggtat cggtccaagt ttgcagacct cacagacgtt gcttcccgca acgcagagct     840

gctccgccag gccaagcacg aggctaatga ctatcgccgc caactgcagg ccttgacctg     900

cgaccttgag tccttgcgcg gcacgaacga gtccttggag aggcaaatgc gcgaacagga     960

ggagcgccac gcgcgggagt cggcgagtta ccaggaggca ctcgctcggc tggaggagga    1020

gggccaaagc ctcaaggagg agatggcccg ccacctgcag gagtaccagg atctactcaa    1080

cgttaagcta gccctggaca tcgagatcgc cacctacagg aaattgctgg agggcgaaga    1140

aaaccgcatc accattcctg tacagacttt ctccaacctc cagatccgag aaaccagcct    1200

ggacaccaaa tctgtgtcag aaggccacct caagaggaac atcgtggtaa agacggtgga    1260

gatgcgggat ggcgaggtca ttaaggagtc gaagcaggag cacaaggatg tgatgctg      1318


<210> 118
<211> 430
<212> PRT
<213> Rattus norvegicus

<220> 
<221> SOURCE
<222> 1..430
<223> /mol_type="protein"
      /note="GFAP"
      /organism="Rattus norvegicus"

<400> 118
Met Glu Arg Arg Arg Ile Thr Ser Ala Arg Arg Ser Tyr Ala Ser Ser 
1               5                   10                   15    
Glu Thr Met Val Arg Gly His Gly Pro Thr Arg His Leu Gly Thr Ile 
            20                   25                  30        
Pro Arg Leu Ser Leu Ser Arg Met Thr Pro Pro Leu Pro Ala Arg Val 
        35                   40                  45            
Asp Phe Ser Leu Ala Gly Ala Leu Asn Ala Gly Phe Lys Glu Thr Arg 
    50                   55                  60                
Ala Ser Glu Arg Ala Glu Met Met Glu Leu Asn Asp Arg Phe Ala Ser 
65                   70                  75                  80
Tyr Ile Glu Lys Val Arg Phe Leu Glu Gln Gln Asn Lys Ala Leu Ala 
                85                   90                  95    
Ala Glu Leu Asn Gln Leu Arg Ala Lys Glu Pro Thr Lys Leu Ala Asp 
            100                  105                110        
Val Tyr Gln Ala Glu Leu Arg Glu Leu Arg Leu Arg Leu Asp Gln Leu 
        115                  120                125            
Thr Thr Asn Ser Ala Arg Leu Glu Val Glu Arg Asp Asn Leu Thr Gln 
    130                  135                140                
Asp Leu Gly Thr Leu Arg Gln Lys Leu Gln Asp Glu Thr Asn Leu Arg 
145                  150                155                  160
Leu Glu Ala Glu Asn Asn Leu Ala Val Tyr Arg Gln Glu Ala Asp Glu 
                165                  170                175    
Ala Thr Leu Ala Arg Val Asp Leu Glu Arg Lys Val Glu Ser Leu Glu 
            180                  185                190        
Glu Glu Ile Gln Phe Leu Arg Lys Ile His Glu Glu Glu Val Arg Glu 
        195                  200                205            
Leu Gln Glu Gln Leu Ala Gln Gln Gln Val His Val Glu Met Asp Val 
    210                  215                220                
Ala Lys Pro Asp Leu Thr Ala Ala Leu Arg Glu Ile Arg Thr Gln Tyr 
225                  230                235                  240
Glu Ala Val Ala Thr Ser Asn Met Gln Glu Thr Glu Glu Trp Tyr Arg 
                245                  250                255    
Ser Lys Phe Ala Asp Leu Thr Asp Val Ala Ser Arg Asn Ala Glu Leu 
            260                  265                270        
Leu Arg Gln Ala Lys His Glu Ala Asn Asp Tyr Arg Arg Gln Leu Gln 
        275                  280                285            
Ala Leu Thr Cys Asp Leu Glu Ser Leu Arg Gly Thr Asn Glu Ser Leu 
    290                  295                300                
Glu Arg Gln Met Arg Glu Gln Glu Glu Arg His Ala Arg Glu Ser Ala 
305                  310                315                  320
Ser Tyr Gln Glu Ala Leu Ala Arg Leu Glu Glu Glu Gly Gln Ser Leu 
                325                  330                335    
Lys Glu Glu Met Ala Arg His Leu Gln Glu Tyr Gln Asp Leu Leu Asn 
            340                  345                350        
Val Lys Leu Ala Leu Asp Ile Glu Ile Ala Thr Tyr Arg Lys Leu Leu 
        355                  360                365            
Glu Gly Glu Glu Asn Arg Ile Thr Ile Pro Val Gln Thr Phe Ser Asn 
    370                  375                380                
Leu Gln Ile Arg Glu Thr Ser Leu Asp Thr Lys Ser Val Ser Glu Gly 
385                  390                395                  400
His Leu Lys Arg Asn Ile Val Val Lys Thr Val Glu Met Arg Asp Gly 
                405                  410                415    
Glu Val Ile Lys Glu Ser Lys Gln Glu His Lys Asp Val Met 
            420                  425                430

